[llvm] r326584 - [ARM] Fix access to stack arguments when re-aligning SP in Armv6m

Momchil Velikov via llvm-commits llvm-commits at lists.llvm.org
Fri Mar 2 07:47:15 PST 2018


Author: chill
Date: Fri Mar  2 07:47:14 2018
New Revision: 326584

URL: http://llvm.org/viewvc/llvm-project?rev=326584&view=rev
Log:
[ARM] Fix access to stack arguments when re-aligning SP in Armv6m

When an Armv6m function dynamically re-aligns the stack, access to incoming
stack arguments (and to stack area, allocated for register varargs) is done via
SP, which is incorrect, as the SP is offset by an unknown amount relative to the
value of SP upon function entry.

This patch fixes it, by making access to "fixed" frame objects be done via FP
when the function needs stack re-alignment.  It also changes the access to
"fixed" frame objects be done via FP (instead of using R6/BP) also for the case
when the stack frame contains variable sized objects. This should allow more
objects to fit within the immediate offset of the load instruction.

All of the above via a small refactoring to reuse the existing
`ARMFrameLowering::ResolveFrameIndexReference.`

Differential Revision: https://reviews.llvm.org/D43566

Added:
    llvm/trunk/test/CodeGen/Thumb/frame-access.ll
Modified:
    llvm/trunk/lib/Target/ARM/ARMFrameLowering.cpp
    llvm/trunk/lib/Target/ARM/ThumbRegisterInfo.cpp

Modified: llvm/trunk/lib/Target/ARM/ARMFrameLowering.cpp
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/ARM/ARMFrameLowering.cpp?rev=326584&r1=326583&r2=326584&view=diff
==============================================================================
--- llvm/trunk/lib/Target/ARM/ARMFrameLowering.cpp (original)
+++ llvm/trunk/lib/Target/ARM/ARMFrameLowering.cpp Fri Mar  2 07:47:14 2018
@@ -919,15 +919,17 @@ ARMFrameLowering::ResolveFrameIndexRefer
           return FPOffset;
         }
       }
-    } else if (AFI->isThumb2Function()) {
+    } else if (AFI->isThumbFunction()) {
+      // Prefer SP to base pointer, if the offset is suitably aligned and in
+      // range as the effective range of the immediate offset is bigger when
+      // basing off SP.
       // Use  add <rd>, sp, #<imm8>
       //      ldr <rd>, [sp, #<imm8>]
-      // if at all possible to save space.
       if (Offset >= 0 && (Offset & 3) == 0 && Offset <= 1020)
         return Offset;
       // In Thumb2 mode, the negative offset is very limited. Try to avoid
       // out of range references. ldr <rt>,[<rn>, #-<imm8>]
-      if (FPOffset >= -255 && FPOffset < 0) {
+      if (AFI->isThumb2Function() && FPOffset >= -255 && FPOffset < 0) {
         FrameReg = RegInfo->getFrameRegister(MF);
         return FPOffset;
       }

Modified: llvm/trunk/lib/Target/ARM/ThumbRegisterInfo.cpp
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/lib/Target/ARM/ThumbRegisterInfo.cpp?rev=326584&r1=326583&r2=326584&view=diff
==============================================================================
--- llvm/trunk/lib/Target/ARM/ThumbRegisterInfo.cpp (original)
+++ llvm/trunk/lib/Target/ARM/ThumbRegisterInfo.cpp Fri Mar  2 07:47:14 2018
@@ -521,21 +521,10 @@ void ThumbRegisterInfo::eliminateFrameIn
   DebugLoc dl = MI.getDebugLoc();
   MachineInstrBuilder MIB(*MBB.getParent(), &MI);
 
-  unsigned FrameReg = ARM::SP;
+  unsigned FrameReg;
   int FrameIndex = MI.getOperand(FIOperandNum).getIndex();
-  int Offset = MF.getFrameInfo().getObjectOffset(FrameIndex) +
-               MF.getFrameInfo().getStackSize() + SPAdj;
-
-  if (MF.getFrameInfo().hasVarSizedObjects()) {
-    assert(SPAdj == 0 && STI.getFrameLowering()->hasFP(MF) && "Unexpected");
-    // There are alloca()'s in this function, must reference off the frame
-    // pointer or base pointer instead.
-    if (!hasBasePointer(MF)) {
-      FrameReg = getFrameRegister(MF);
-      Offset -= AFI->getFramePtrSpillOffset();
-    } else
-      FrameReg = BasePtr;
-  }
+  const ARMFrameLowering *TFI = getFrameLowering(MF);
+  int Offset = TFI->ResolveFrameIndexReference(MF, FrameIndex, FrameReg, SPAdj);
 
   // PEI::scavengeFrameVirtualRegs() cannot accurately track SPAdj because the
   // call frame setup/destroy instructions have already been eliminated.  That

Added: llvm/trunk/test/CodeGen/Thumb/frame-access.ll
URL: http://llvm.org/viewvc/llvm-project/llvm/trunk/test/CodeGen/Thumb/frame-access.ll?rev=326584&view=auto
==============================================================================
--- llvm/trunk/test/CodeGen/Thumb/frame-access.ll (added)
+++ llvm/trunk/test/CodeGen/Thumb/frame-access.ll Fri Mar  2 07:47:14 2018
@@ -0,0 +1,416 @@
+; RUN: llc -mtriple=thumbv6m-eabi -disable-fp-elim=false %s -o - | FileCheck %s
+
+; struct S { int x[128]; } s;
+; int f(int *, int, int, int, struct S);
+; int g(int *, int, int, int, int, int);
+; int h(int *, int *, int *);
+; int u(int *, int *, int *, struct S, struct S);
+
+%struct.S = type { [128 x i32] }
+%struct.__va_list = type { i8* }
+
+ at s = common dso_local global %struct.S zeroinitializer, align 4
+
+declare void @llvm.va_start(i8*)
+declare dso_local i32 @g(i32*, i32, i32, i32, i32, i32) local_unnamed_addr
+declare dso_local i32 @f(i32*, i32, i32, i32, %struct.S* byval align 4) local_unnamed_addr
+declare dso_local i32 @h(i32*, i32*, i32*) local_unnamed_addr
+declare dso_local i32 @u(i32*, i32*, i32*, %struct.S* byval align 4, %struct.S* byval align 4) local_unnamed_addr
+
+;
+; Test access to arguments, passed on stack (including varargs)
+;
+
+; Usual case, access via SP
+; int test_args_sp(int a, int b, int c, int d, int e) {
+;   int v[4];
+;   return g(v, a, b, c, d, e);
+; }
+define dso_local i32 @test_args_sp(i32 %a, i32 %b, i32 %c, i32 %d, i32 %e) local_unnamed_addr {
+entry:
+  %v = alloca [4 x i32], align 4
+  %0 = bitcast [4 x i32]* %v to i8*
+  %arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
+  %call = call i32 @g(i32* nonnull %arraydecay, i32 %a, i32 %b, i32 %c, i32 %d, i32 %e)
+  ret i32 %call
+}
+; CHECK-LABEL: test_args_sp
+; Load `e`
+; CHECK:       ldr    r0, [sp, #40]
+; CHECK-NEXT:  mov    r5, sp
+; CHECK-NEXT:  str    r3, [r5]
+; Pass `e` on stack
+; CHECK-NEXT:  str    r0, [r5, #4]
+; CHECK:       bl    g
+
+; int test_varargs_sp(int a, ...) {
+;   int v[4];
+;   __builtin_va_list ap;
+;   __builtin_va_start(ap, a);
+;   return g(v, a, 0, 0, 0, 0);
+; }
+define dso_local i32 @test_varargs_sp(i32 %a, ...) local_unnamed_addr  {
+entry:
+  %v = alloca [4 x i32], align 4
+  %ap = alloca %struct.__va_list, align 4
+  %0 = bitcast [4 x i32]* %v to i8*
+  %1 = bitcast %struct.__va_list* %ap to i8*
+  call void @llvm.va_start(i8* nonnull %1)
+  %arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
+  %call = call i32 @g(i32* nonnull %arraydecay, i32 %a, i32 0, i32 0, i32 0, i32 0)
+  ret i32 %call
+}
+; CHECK-LABEL: test_varargs_sp
+; Three incoming varargs in registers
+; CHECK:       sub sp, #12
+; CHECK:       sub sp, #28
+; Incoming arguments area is accessed via SP
+; CHECK:       add r0, sp, #36
+; CHECK:       stm r0!, {r1, r2, r3}
+
+; Re-aligned stack, access via FP
+; int test_args_realign(int a, int b, int c, int d, int e) {
+;   __attribute__((aligned(16))) int v[4];
+;   return g(v, a, b, c, d, e);
+; }
+; Function Attrs: nounwind
+define dso_local i32 @test_args_realign(i32 %a, i32 %b, i32 %c, i32 %d, i32 %e) local_unnamed_addr  {
+entry:
+  %v = alloca [4 x i32], align 16
+  %0 = bitcast [4 x i32]* %v to i8*
+  %arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
+  %call = call i32 @g(i32* nonnull %arraydecay, i32 %a, i32 %b, i32 %c, i32 %d, i32 %e)
+  ret i32 %call
+}
+; CHECK-LABEL: test_args_realign
+; Setup frame pointer
+; CHECK:       add r7, sp, #8
+; Align stack
+; CHECK:       mov  r4, sp
+; CHECK-NEXT:  lsrs r4, r4, #4
+; CHECK-NEXT:  lsls r4, r4, #4
+; CHECK-NEXT:  mov  sp, r4
+; Load `e` via FP
+; CHECK:       ldr r0, [r7, #8]
+; CHECK-NEXT:  mov r5, sp
+; CHECK-NEXT:  str r3, [r5]
+; Pass `e` as argument
+; CHECK-NEXT:  str r0, [r5, #4]
+; CHECK:       bl    g
+
+; int test_varargs_realign(int a, ...) {
+;   __attribute__((aligned(16))) int v[4];
+;   __builtin_va_list ap;
+;   __builtin_va_start(ap, a);
+;   return g(v, a, 0, 0, 0, 0);
+; }
+define dso_local i32 @test_varargs_realign(i32 %a, ...) local_unnamed_addr  {
+entry:
+  %v = alloca [4 x i32], align 16
+  %ap = alloca %struct.__va_list, align 4
+  %0 = bitcast [4 x i32]* %v to i8*
+  %1 = bitcast %struct.__va_list* %ap to i8*
+  call void @llvm.va_start(i8* nonnull %1)
+  %arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
+  %call = call i32 @g(i32* nonnull %arraydecay, i32 %a, i32 0, i32 0, i32 0, i32 0)
+  ret i32 %call
+}
+; CHECK-LABEL: test_varargs_realign
+; Three incoming register varargs
+; CHECK:       sub sp, #12
+; Setup frame pointer
+; CHECK:       add r7, sp, #8
+; Align stack
+; CHECK:       mov  r4, sp
+; CHECK-NEXT:  lsrs r4, r4, #4
+; CHECK-NEXT:  lsls r4, r4, #4
+; CHECK-NEXT:  mov  sp, r4
+; Incoming register varargs stored via FP
+; CHECK:       str r3, [r7, #16]
+; CHECK-NEXT:  str r2, [r7, #12]
+; CHECK-NEXT:  str r1, [r7, #8]
+
+; VLAs present, access via FP
+; int test_args_vla(int a, int b, int c, int d, int e) {
+;   int v[a];
+;   return g(v, a, b, c, d, e);
+; }
+define dso_local i32 @test_args_vla(i32 %a, i32 %b, i32 %c, i32 %d, i32 %e) local_unnamed_addr  {
+entry:
+  %vla = alloca i32, i32 %a, align 4
+  %call = call i32 @g(i32* nonnull %vla, i32 %a, i32 %b, i32 %c, i32 %d, i32 %e)
+  ret i32 %call
+}
+; CHECK-LABEL: test_args_vla
+; Setup frame pointer
+; CHECK:       add r7, sp, #12
+; Allocate outgoing stack arguments space
+; CHECK:       sub sp, #4
+; Load `e` via FP
+; CHECK:       ldr r5, [r7, #8]
+; CHECK-NEXT:  mov r0, sp
+; Pass `d` and `e` as arguments
+; CHECK-NEXT:  stm r0!, {r3, r5}
+; CHECK:       bl  g
+
+; int test_varargs_vla(int a, ...) {
+;   int v[a];
+;   __builtin_va_list ap;
+;   __builtin_va_start(ap, a);
+;   return g(v, a, 0, 0, 0, 0);
+; }
+define dso_local i32 @test_varargs_vla(i32 %a, ...) local_unnamed_addr  {
+entry:
+  %ap = alloca %struct.__va_list, align 4
+  %vla = alloca i32, i32 %a, align 4
+  %0 = bitcast %struct.__va_list* %ap to i8*
+  call void @llvm.va_start(i8* nonnull %0)
+  %call = call i32 @g(i32* nonnull %vla, i32 %a, i32 0, i32 0, i32 0, i32 0)
+  ret i32 %call
+}
+; CHECK-LABEL: test_varargs_vla
+; Three incoming register varargs
+; CHECK:       sub sp, #12
+; Setup frame pointer
+; CHECK:       add r7, sp, #8
+; Register varargs stored via FP
+; CHECK:       str r3, [r7, #16]
+; CHECK-NEXT:  str r2, [r7, #12]
+; CHECK-NEXT:  str r1, [r7, #8]
+
+; Moving SP, access via SP
+; int test_args_moving_sp(int a, int b, int c, int d, int e) {
+;   int v[4];
+;   return f(v, a, b + c + d, e, s) + h(v, v+1, v+2);
+; }
+define dso_local i32 @test_args_moving_sp(i32 %a, i32 %b, i32 %c, i32 %d, i32 %e) local_unnamed_addr  {
+entry:
+  %v = alloca [4 x i32], align 4
+  %0 = bitcast [4 x i32]* %v to i8*
+  %arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
+  %add = add nsw i32 %c, %b
+  %add1 = add nsw i32 %add, %d
+  %call = call i32 @f(i32* nonnull %arraydecay, i32 %a, i32 %add1, i32 %e, %struct.S* byval nonnull align 4 @s)
+  %add.ptr = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 1
+  %add.ptr5 = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 2
+  %call6 = call i32 @h(i32* nonnull %arraydecay, i32* nonnull %add.ptr, i32* nonnull %add.ptr5)
+  %add7 = add nsw i32 %call6, %call
+  ret i32 %add7
+}
+; CHECK-LABEL: test_args_moving_sp
+; 20 bytes callee-saved area
+; CHECK:       push {r4, r5, r6, r7, lr}
+; 20 bytes locals
+; CHECK:       sub sp, #20
+; Allocate outgoing arguments space
+; CHECK:       sub sp, #508
+; CHECK:       sub sp, #4
+; Load `e` via SP, 552 = 512 + 20 + 20
+; CHECK:       ldr r3, [sp, #552]
+; CHECK:       bl  f
+; Stack restored before next call
+; CHECK-NEXT:  add sp, #508
+; CHECK-NEXT:  add sp, #4
+; CHECK:       bl  h
+
+; int test_varargs_moving_sp(int a, ...) {
+;   int v[4];
+;   __builtin_va_list ap;
+;   __builtin_va_start(ap, a);
+;   return f(v, a, 0, 0, s) + h(v, v+1, v+2);
+; }
+define dso_local i32 @test_varargs_moving_sp(i32 %a, ...) local_unnamed_addr  {
+entry:
+  %v = alloca [4 x i32], align 4
+  %ap = alloca %struct.__va_list, align 4
+  %0 = bitcast [4 x i32]* %v to i8*
+  %1 = bitcast %struct.__va_list* %ap to i8*
+  call void @llvm.va_start(i8* nonnull %1)
+  %arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
+  %call = call i32 @f(i32* nonnull %arraydecay, i32 %a, i32 0, i32 0, %struct.S* byval nonnull align 4 @s)
+  %add.ptr = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 1
+  %add.ptr5 = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 2
+  %call6 = call i32 @h(i32* nonnull %arraydecay, i32* nonnull %add.ptr, i32* nonnull %add.ptr5)
+  %add = add nsw i32 %call6, %call
+  ret i32 %add
+}
+; CHECK-LABEL: test_varargs_moving_sp
+; Three incoming register varargs
+; CHECK:       sub sp, #12
+; 16 bytes callee-saves
+; CHECK:       push {r4, r5, r7, lr}
+; 20 bytes locals
+; CHECK:       sub sp, #20
+; Incoming varargs stored via SP, 36 = 20 + 16
+; CHECK:       add r0, sp, #36
+; CHECK-NEXT:  stm r0!, {r1, r2, r3}
+
+;
+; Access to locals
+;
+
+; Usual case, access via SP.
+; int test_local(int n) {
+;   int v[4];
+;   int x, y, z;
+;   h(&x, &y, &z);
+;   return g(v, x, y, z, 0, 0);
+; }
+define dso_local i32 @test_local(i32 %n) local_unnamed_addr  {
+entry:
+  %v = alloca [4 x i32], align 4
+  %x = alloca i32, align 4
+  %y = alloca i32, align 4
+  %z = alloca i32, align 4
+  %0 = bitcast [4 x i32]* %v to i8*
+  %1 = bitcast i32* %x to i8*
+  %2 = bitcast i32* %y to i8*
+  %3 = bitcast i32* %z to i8*
+  %call = call i32 @h(i32* nonnull %x, i32* nonnull %y, i32* nonnull %z)
+  %arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
+  %4 = load i32, i32* %x, align 4
+  %5 = load i32, i32* %y, align 4
+  %6 = load i32, i32* %z, align 4
+  %call1 = call i32 @g(i32* nonnull %arraydecay, i32 %4, i32 %5, i32 %6, i32 0, i32 0)
+  ret i32 %call1
+}
+; CHECK-LABEL: test_local
+; Arguments to `h` relative to SP
+; CHECK:       add r0, sp, #20
+; CHECK-NEXT:  add r1, sp, #16
+; CHECK-NEXT:  add r2, sp, #12
+; CHECK-NEXT:  bl  h
+; Load `x`, `y`, and `z` via SP
+; CHECK:       ldr r1, [sp, #20]
+; CHECK-NEXT:  ldr r2, [sp, #16]
+; CHECK-NEXT:  ldr r3, [sp, #12]
+; CHECK:       bl  g
+
+; Re-aligned stack, access via SP.
+; int test_local_realign(int n) {
+;   __attribute__((aligned(16))) int v[4];
+;   int x, y, z;
+;   h(&x, &y, &z);
+;   return g(v, x, y, z, 0, 0);
+; }
+define dso_local i32 @test_local_realign(i32 %n) local_unnamed_addr  {
+entry:
+  %v = alloca [4 x i32], align 16
+  %x = alloca i32, align 4
+  %y = alloca i32, align 4
+  %z = alloca i32, align 4
+  %0 = bitcast [4 x i32]* %v to i8*
+  %1 = bitcast i32* %x to i8*
+  %2 = bitcast i32* %y to i8*
+  %3 = bitcast i32* %z to i8*
+  %call = call i32 @h(i32* nonnull %x, i32* nonnull %y, i32* nonnull %z)
+  %arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
+  %4 = load i32, i32* %x, align 4
+  %5 = load i32, i32* %y, align 4
+  %6 = load i32, i32* %z, align 4
+  %call1 = call i32 @g(i32* nonnull %arraydecay, i32 %4, i32 %5, i32 %6, i32 0, i32 0)
+  ret i32 %call1
+}
+; CHECK-LABEL: test_local_realign
+; Setup frame pointer
+; CHECK:       add r7, sp, #8
+; Re-align stack
+; CHECK:       mov r4, sp
+; CHECK-NEXT:  lsrs r4, r4, #4
+; CHECK-NEXT:  lsls r4, r4, #4
+; CHECK-NEXT:  mov  sp, r4
+; Arguments to `h` computed relative to SP
+; CHECK:       add r0, sp, #28
+; CHECK-NEXT:  add r1, sp, #24
+; CHECK-NEXT:  add r2, sp, #20
+; CHECK-NEXT:  bl  h
+; Load `x`, `y`, and `z` via SP for passing to `g`
+; CHECK:       ldr r1, [sp, #28]
+; CHECK-NEXT:  ldr r2, [sp, #24]
+; CHECK-NEXT:  ldr r3, [sp, #20]
+; CHECK:       bl  g
+
+; VLAs, access via BP.
+; int test_local_vla(int n) {
+;   int v[n];
+;   int x, y, z;
+;   h(&x, &y, &z);
+;   return g(v, x, y, z, 0, 0);
+; }
+define dso_local i32 @test_local_vla(i32 %n) local_unnamed_addr  {
+entry:
+  %x = alloca i32, align 4
+  %y = alloca i32, align 4
+  %z = alloca i32, align 4
+  %vla = alloca i32, i32 %n, align 4
+  %0 = bitcast i32* %x to i8*
+  %1 = bitcast i32* %y to i8*
+  %2 = bitcast i32* %z to i8*
+  %call = call i32 @h(i32* nonnull %x, i32* nonnull %y, i32* nonnull %z)
+  %3 = load i32, i32* %x, align 4
+  %4 = load i32, i32* %y, align 4
+  %5 = load i32, i32* %z, align 4
+  %call1 = call i32 @g(i32* nonnull %vla, i32 %3, i32 %4, i32 %5, i32 0, i32 0)
+  ret i32 %call1
+}
+; CHECK-LABEL: test_local_vla
+; Setup frame pointer
+; CHECK:       add  r7, sp, #12
+; Setup base pointer
+; CHECK:       mov  r6, sp
+; CHECK:       mov  r5, r6
+; Arguments to `h` compute relative to BP
+; CHECK:       adds r0, r6, #7
+; CHECK-NEXT:  adds r0, #1
+; CHECK-NEXT:  adds r1, r6, #4
+; CHECK-NEXT:  mov  r2, r6
+; CHECK-NEXT:  bl   h
+; Load `x`, `y`, `z` via BP (r5 should still have the value of r6 from the move
+; above)
+; CHECK:       ldr r3, [r5]
+; CHECK-NEXT:  ldr r2, [r5, #4]
+; CHECK-NEXT:  ldr r1, [r5, #8]
+; CHECK:       bl  g
+
+;  Moving SP, access via SP.
+; int test_local_moving_sp(int n) {
+;   int v[4];
+;   int x, y, z;
+;   return u(v, &x, &y, s, s) + u(v, &y, &z, s, s);
+; }
+define dso_local i32 @test_local_moving_sp(i32 %n) local_unnamed_addr {
+entry:
+  %v = alloca [4 x i32], align 4
+  %x = alloca i32, align 4
+  %y = alloca i32, align 4
+  %z = alloca i32, align 4
+  %0 = bitcast [4 x i32]* %v to i8*
+  %1 = bitcast i32* %x to i8*
+  %2 = bitcast i32* %y to i8*
+  %3 = bitcast i32* %z to i8*
+  %arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
+  %call = call i32 @u(i32* nonnull %arraydecay, i32* nonnull %x, i32* nonnull %y, %struct.S* byval nonnull align 4 @s, %struct.S* byval nonnull align 4 @s)
+  %call2 = call i32 @u(i32* nonnull %arraydecay, i32* nonnull %y, i32* nonnull %z, %struct.S* byval nonnull align 4 @s, %struct.S* byval nonnull align 4 @s)
+  %add = add nsw i32 %call2, %call
+  ret i32 %add
+}
+; CHECK-LABEL: test_local_moving_sp
+; Locals area
+; CHECK:      sub sp, #36
+; Outoging arguments
+; CHECK:      sub sp, #508
+; CHECK-NEXT: sub sp, #508
+; CHECK-NEXT: sub sp, #8
+; Argument addresses computed relative to SP
+; CHECK:      add  r4, sp, #1020
+; CHECK-NEXT: adds r4, #24
+; CHECK:      add  r1, sp, #1020
+; CHECK-NEXT: adds r1, #20
+; CHECK:      add  r5, sp, #1020
+; CHECK-NEXT: adds r5, #16
+; CHECK:      bl   u
+; Stack restored before next call
+; CHECK:      add  sp, #508
+; CHECK-NEXT: add  sp, #508
+; CHECK-NEXT: add  sp, #8
+; CHECK:      bl   u




More information about the llvm-commits mailing list