; blob: 7b6f5ba3eac29934c7a8aa1414fcd35b90b1e128 [file] [log] [blame]
; RUN: llc -mtriple=thumbv6m-eabi -disable-fp-elim=false %s -o - | FileCheck %s
; struct S { int x[128]; } s;
; int f(int *, int, int, int, struct S);
; int g(int *, int, int, int, int, int);
; int h(int *, int *, int *);
; int u(int *, int *, int *, struct S, struct S);
; IR form of `struct S` from the C prototypes above: a 128-element i32 array.
%struct.S = type { [128 x i32] }
; va_list representation used by the varargs tests: a single i8* field.
%struct.__va_list = type { i8* }
; The global `s`; passed byval to @f and @u by the *_moving_sp tests.
@s = common dso_local global %struct.S zeroinitializer, align 4
; Intrinsic called by every test_varargs_* function on its `ap` slot.
declare void @llvm.va_start(i8*)
; External callees (declarations only, no bodies in this file).
; @g: one pointer plus five i32 arguments.
declare dso_local i32 @g(i32*, i32, i32, i32, i32, i32) local_unnamed_addr
; @f: one pointer, three i32 arguments, and one %struct.S passed byval.
declare dso_local i32 @f(i32*, i32, i32, i32, %struct.S* byval align 4) local_unnamed_addr
; @h: three pointers.
declare dso_local i32 @h(i32*, i32*, i32*) local_unnamed_addr
; @u: three pointers followed by two %struct.S arguments passed byval.
declare dso_local i32 @u(i32*, i32*, i32*, %struct.S* byval align 4, %struct.S* byval align 4) local_unnamed_addr
;
; Test access to arguments, passed on stack (including varargs)
;
; Usual case, access via SP
; int test_args_sp(int a, int b, int c, int d, int e) {
; int v[4];
; return g(v, a, b, c, d, e);
; }
; Baseline argument-access case: one fixed-size local with 4-byte alignment and
; no dynamic alloca. All five incoming i32 arguments are forwarded to @g.
define dso_local i32 @test_args_sp(i32 %a, i32 %b, i32 %c, i32 %d, i32 %e) local_unnamed_addr {
entry:
; Local array `v` (4 x i32).
%v = alloca [4 x i32], align 4
; The result of this cast is not used anywhere in the function.
%0 = bitcast [4 x i32]* %v to i8*
; Pointer to v[0], passed as the first argument of @g.
%arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
; g(v, a, b, c, d, e)
%call = call i32 @g(i32* nonnull %arraydecay, i32 %a, i32 %b, i32 %c, i32 %d, i32 %e)
ret i32 %call
}
; CHECK-LABEL: test_args_sp
; Load `e`
; CHECK: ldr r0, [sp, #40]
; CHECK-NEXT: mov r5, sp
; CHECK-NEXT: str r3, [r5]
; Pass `e` on stack
; CHECK-NEXT: str r0, [r5, #4]
; CHECK: bl g
; int test_varargs_sp(int a, ...) {
; int v[4];
; __builtin_va_list ap;
; __builtin_va_start(ap, a);
; return g(v, a, 0, 0, 0, 0);
; }
; Baseline variadic case: fixed-size locals with 4-byte alignment, no dynamic
; alloca. Calls va_start so the function is treated as using its varargs.
define dso_local i32 @test_varargs_sp(i32 %a, ...) local_unnamed_addr {
entry:
; Local array `v` (4 x i32).
%v = alloca [4 x i32], align 4
; Storage for the va_list `ap`.
%ap = alloca %struct.__va_list, align 4
; The result of this cast is not used anywhere in the function.
%0 = bitcast [4 x i32]* %v to i8*
; i8* view of `ap`, as required by the va_start intrinsic signature.
%1 = bitcast %struct.__va_list* %ap to i8*
call void @llvm.va_start(i8* nonnull %1)
; Pointer to v[0], passed as the first argument of @g.
%arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
; g(v, a, 0, 0, 0, 0) -- only the named argument `a` is forwarded.
%call = call i32 @g(i32* nonnull %arraydecay, i32 %a, i32 0, i32 0, i32 0, i32 0)
ret i32 %call
}
; CHECK-LABEL: test_varargs_sp
; Three incoming varargs in registers
; CHECK: sub sp, #12
; CHECK: sub sp, #28
; Incoming arguments area is accessed via SP
; CHECK: add r0, sp, #36
; CHECK: stm r0!, {r1, r2, r3}
; Re-aligned stack, access via FP
; int test_args_realign(int a, int b, int c, int d, int e) {
; __attribute__((aligned(16))) int v[4];
; return g(v, a, b, c, d, e);
; }
; Function Attrs: nounwind
; Same shape as test_args_sp, except the local array requests 16-byte
; alignment. The expectations after this function look for a stack
; re-alignment sequence and for `e` being loaded through r7.
define dso_local i32 @test_args_realign(i32 %a, i32 %b, i32 %c, i32 %d, i32 %e) local_unnamed_addr {
entry:
; Local array `v` (4 x i32) with 16-byte alignment.
%v = alloca [4 x i32], align 16
; The result of this cast is not used anywhere in the function.
%0 = bitcast [4 x i32]* %v to i8*
; Pointer to v[0], passed as the first argument of @g.
%arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
; g(v, a, b, c, d, e)
%call = call i32 @g(i32* nonnull %arraydecay, i32 %a, i32 %b, i32 %c, i32 %d, i32 %e)
ret i32 %call
}
; CHECK-LABEL: test_args_realign
; Setup frame pointer
; CHECK: add r7, sp, #8
; Align stack
; CHECK: mov r4, sp
; CHECK-NEXT: lsrs r4, r4, #4
; CHECK-NEXT: lsls r4, r4, #4
; CHECK-NEXT: mov sp, r4
; Load `e` via FP
; CHECK: ldr r0, [r7, #8]
; CHECK-NEXT: mov r5, sp
; CHECK-NEXT: str r3, [r5]
; Pass `e` as argument
; CHECK-NEXT: str r0, [r5, #4]
; CHECK: bl g
; int test_varargs_realign(int a, ...) {
; __attribute__((aligned(16))) int v[4];
; __builtin_va_list ap;
; __builtin_va_start(ap, a);
; return g(v, a, 0, 0, 0, 0);
; }
; Variadic counterpart of test_args_realign: the local array requests 16-byte
; alignment and va_start is called on `ap`.
define dso_local i32 @test_varargs_realign(i32 %a, ...) local_unnamed_addr {
entry:
; Local array `v` (4 x i32) with 16-byte alignment.
%v = alloca [4 x i32], align 16
; Storage for the va_list `ap` (ordinary 4-byte alignment).
%ap = alloca %struct.__va_list, align 4
; The result of this cast is not used anywhere in the function.
%0 = bitcast [4 x i32]* %v to i8*
; i8* view of `ap`, as required by the va_start intrinsic signature.
%1 = bitcast %struct.__va_list* %ap to i8*
call void @llvm.va_start(i8* nonnull %1)
; Pointer to v[0], passed as the first argument of @g.
%arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
; g(v, a, 0, 0, 0, 0) -- only the named argument `a` is forwarded.
%call = call i32 @g(i32* nonnull %arraydecay, i32 %a, i32 0, i32 0, i32 0, i32 0)
ret i32 %call
}
; CHECK-LABEL: test_varargs_realign
; Three incoming register varargs
; CHECK: sub sp, #12
; Setup frame pointer
; CHECK: add r7, sp, #8
; Align stack
; CHECK: mov r4, sp
; CHECK-NEXT: lsrs r4, r4, #4
; CHECK-NEXT: lsls r4, r4, #4
; CHECK-NEXT: mov sp, r4
; Incoming register varargs stored via FP
; CHECK: str r3, [r7, #16]
; CHECK-NEXT: str r2, [r7, #12]
; CHECK-NEXT: str r1, [r7, #8]
; VLAs present, access via FP
; int test_args_vla(int a, int b, int c, int d, int e) {
; int v[a];
; return g(v, a, b, c, d, e);
; }
; Argument access in the presence of a variable-length array: the only local
; is an alloca whose element count is the runtime value %a.
define dso_local i32 @test_args_vla(i32 %a, i32 %b, i32 %c, i32 %d, i32 %e) local_unnamed_addr {
entry:
; `int v[a]` -- %a elements of i32, sized at run time.
%vla = alloca i32, i32 %a, align 4
; g(v, a, b, c, d, e)
%call = call i32 @g(i32* nonnull %vla, i32 %a, i32 %b, i32 %c, i32 %d, i32 %e)
ret i32 %call
}
; CHECK-LABEL: test_args_vla
; Setup frame pointer
; CHECK: add r7, sp, #12
; Allocate outgoing stack arguments space
; CHECK: sub sp, #4
; Load `e` via FP
; CHECK: ldr r5, [r7, #8]
; CHECK-NEXT: mov r0, sp
; Pass `d` and `e` as arguments
; CHECK-NEXT: stm r0!, {r3, r5}
; CHECK: bl g
; int test_varargs_vla(int a, ...) {
; int v[a];
; __builtin_va_list ap;
; __builtin_va_start(ap, a);
; return g(v, a, 0, 0, 0, 0);
; }
; Variadic counterpart of test_args_vla: a fixed va_list slot plus an alloca
; whose element count is the runtime value %a.
define dso_local i32 @test_varargs_vla(i32 %a, ...) local_unnamed_addr {
entry:
; Storage for the va_list `ap`.
%ap = alloca %struct.__va_list, align 4
; `int v[a]` -- %a elements of i32, sized at run time.
%vla = alloca i32, i32 %a, align 4
; i8* view of `ap`, as required by the va_start intrinsic signature.
%0 = bitcast %struct.__va_list* %ap to i8*
call void @llvm.va_start(i8* nonnull %0)
; g(v, a, 0, 0, 0, 0) -- only the named argument `a` is forwarded.
%call = call i32 @g(i32* nonnull %vla, i32 %a, i32 0, i32 0, i32 0, i32 0)
ret i32 %call
}
; CHECK-LABEL: test_varargs_vla
; Three incoming register varargs
; CHECK: sub sp, #12
; Setup frame pointer
; CHECK: add r7, sp, #8
; Register varargs stored via FP
; CHECK: str r3, [r7, #16]
; CHECK-NEXT: str r2, [r7, #12]
; CHECK-NEXT: str r1, [r7, #8]
; Moving SP, access via SP
; int test_args_moving_sp(int a, int b, int c, int d, int e) {
; int v[4];
; return f(v, a, b + c + d, e, s) + h(v, v+1, v+2);
; }
; Argument access when a call passes a large byval aggregate: @f receives the
; global @s (%struct.S, 128 x i32) by value, followed by a second call to @h
; that takes only pointers. The expectations after this function look for the
; stack pointer being lowered around the call to f and restored before h.
define dso_local i32 @test_args_moving_sp(i32 %a, i32 %b, i32 %c, i32 %d, i32 %e) local_unnamed_addr {
entry:
; Local array `v` (4 x i32).
%v = alloca [4 x i32], align 4
; The result of this cast is not used anywhere in the function.
%0 = bitcast [4 x i32]* %v to i8*
; Pointer to v[0]; reused as the first argument of both calls.
%arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
; b + c + d, passed as the third argument of @f.
%add = add nsw i32 %c, %b
%add1 = add nsw i32 %add, %d
; f(v, a, b + c + d, e, s) -- `s` is passed byval.
%call = call i32 @f(i32* nonnull %arraydecay, i32 %a, i32 %add1, i32 %e, %struct.S* byval nonnull align 4 @s)
; v + 1 and v + 2
%add.ptr = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 1
%add.ptr5 = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 2
; h(v, v + 1, v + 2)
%call6 = call i32 @h(i32* nonnull %arraydecay, i32* nonnull %add.ptr, i32* nonnull %add.ptr5)
; Sum of the two call results is the return value.
%add7 = add nsw i32 %call6, %call
ret i32 %add7
}
; CHECK-LABEL: test_args_moving_sp
; 20 bytes callee-saved area
; CHECK: push {r4, r5, r6, r7, lr}
; 20 bytes locals
; CHECK: sub sp, #20
; Allocate outgoing arguments space
; CHECK: sub sp, #508
; CHECK: sub sp, #4
; Load `e` via SP, 552 = 512 + 20 + 20
; CHECK: ldr r3, [sp, #552]
; CHECK: bl f
; Stack restored before next call
; CHECK-NEXT: add sp, #508
; CHECK-NEXT: add sp, #4
; CHECK: bl h
; int test_varargs_moving_sp(int a, ...) {
; int v[4];
; __builtin_va_list ap;
; __builtin_va_start(ap, a);
; return f(v, a, 0, 0, s) + h(v, v+1, v+2);
; }
; Variadic counterpart of test_args_moving_sp: va_start is called on `ap`, then
; @f receives the global @s byval, then @h is called with pointers into `v`.
define dso_local i32 @test_varargs_moving_sp(i32 %a, ...) local_unnamed_addr {
entry:
; Local array `v` (4 x i32).
%v = alloca [4 x i32], align 4
; Storage for the va_list `ap`.
%ap = alloca %struct.__va_list, align 4
; The result of this cast is not used anywhere in the function.
%0 = bitcast [4 x i32]* %v to i8*
; i8* view of `ap`, as required by the va_start intrinsic signature.
%1 = bitcast %struct.__va_list* %ap to i8*
call void @llvm.va_start(i8* nonnull %1)
; Pointer to v[0]; reused as the first argument of both calls.
%arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
; f(v, a, 0, 0, s) -- `s` is passed byval.
%call = call i32 @f(i32* nonnull %arraydecay, i32 %a, i32 0, i32 0, %struct.S* byval nonnull align 4 @s)
; v + 1 and v + 2
%add.ptr = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 1
%add.ptr5 = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 2
; h(v, v + 1, v + 2)
%call6 = call i32 @h(i32* nonnull %arraydecay, i32* nonnull %add.ptr, i32* nonnull %add.ptr5)
; Sum of the two call results is the return value.
%add = add nsw i32 %call6, %call
ret i32 %add
}
; CHECK-LABEL: test_varargs_moving_sp
; Three incoming register varargs
; CHECK: sub sp, #12
; 16 bytes callee-saves
; CHECK: push {r4, r5, r7, lr}
; 20 bytes locals
; CHECK: sub sp, #20
; Incoming varargs stored via SP, 36 = 20 + 16
; CHECK: add r0, sp, #36
; CHECK-NEXT: stm r0!, {r1, r2, r3}
;
; Access to locals
;
; Usual case, access via SP.
; int test_local(int n) {
; int v[4];
; int x, y, z;
; h(&x, &y, &z);
; return g(v, x, y, z, 0, 0);
; }
; Baseline local-variable access case: four fixed-size locals with 4-byte
; alignment. The addresses of x, y, z are passed to @h, then their values are
; reloaded and passed to @g. The incoming argument %n is not used.
define dso_local i32 @test_local(i32 %n) local_unnamed_addr {
entry:
; Locals: array `v` and scalars `x`, `y`, `z`.
%v = alloca [4 x i32], align 4
%x = alloca i32, align 4
%y = alloca i32, align 4
%z = alloca i32, align 4
; The results of these four casts are not used anywhere in the function.
%0 = bitcast [4 x i32]* %v to i8*
%1 = bitcast i32* %x to i8*
%2 = bitcast i32* %y to i8*
%3 = bitcast i32* %z to i8*
; h(&x, &y, &z); the returned value is ignored.
%call = call i32 @h(i32* nonnull %x, i32* nonnull %y, i32* nonnull %z)
; Pointer to v[0], passed as the first argument of @g.
%arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
; Reload x, y, z after the call to h, which received their addresses.
%4 = load i32, i32* %x, align 4
%5 = load i32, i32* %y, align 4
%6 = load i32, i32* %z, align 4
; g(v, x, y, z, 0, 0)
%call1 = call i32 @g(i32* nonnull %arraydecay, i32 %4, i32 %5, i32 %6, i32 0, i32 0)
ret i32 %call1
}
; CHECK-LABEL: test_local
; Arguments to `h` relative to SP
; CHECK: add r0, sp, #20
; CHECK-NEXT: add r1, sp, #16
; CHECK-NEXT: add r2, sp, #12
; CHECK-NEXT: bl h
; Load `x`, `y`, and `z` via SP
; CHECK: ldr r1, [sp, #20]
; CHECK-NEXT: ldr r2, [sp, #16]
; CHECK-NEXT: ldr r3, [sp, #12]
; CHECK: bl g
; Re-aligned stack, access via SP.
; int test_local_realign(int n) {
; __attribute__((aligned(16))) int v[4];
; int x, y, z;
; h(&x, &y, &z);
; return g(v, x, y, z, 0, 0);
; }
; Same shape as test_local, except the array `v` requests 16-byte alignment.
; The expectations after this function look for a stack re-alignment sequence
; while the locals are still addressed relative to sp. %n is not used.
define dso_local i32 @test_local_realign(i32 %n) local_unnamed_addr {
entry:
; Array `v` with 16-byte alignment; scalars keep 4-byte alignment.
%v = alloca [4 x i32], align 16
%x = alloca i32, align 4
%y = alloca i32, align 4
%z = alloca i32, align 4
; The results of these four casts are not used anywhere in the function.
%0 = bitcast [4 x i32]* %v to i8*
%1 = bitcast i32* %x to i8*
%2 = bitcast i32* %y to i8*
%3 = bitcast i32* %z to i8*
; h(&x, &y, &z); the returned value is ignored.
%call = call i32 @h(i32* nonnull %x, i32* nonnull %y, i32* nonnull %z)
; Pointer to v[0], passed as the first argument of @g.
%arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
; Reload x, y, z after the call to h, which received their addresses.
%4 = load i32, i32* %x, align 4
%5 = load i32, i32* %y, align 4
%6 = load i32, i32* %z, align 4
; g(v, x, y, z, 0, 0)
%call1 = call i32 @g(i32* nonnull %arraydecay, i32 %4, i32 %5, i32 %6, i32 0, i32 0)
ret i32 %call1
}
; CHECK-LABEL: test_local_realign
; Setup frame pointer
; CHECK: add r7, sp, #8
; Re-align stack
; CHECK: mov r4, sp
; CHECK-NEXT: lsrs r4, r4, #4
; CHECK-NEXT: lsls r4, r4, #4
; CHECK-NEXT: mov sp, r4
; Arguments to `h` computed relative to SP
; CHECK: add r0, sp, #28
; CHECK-NEXT: add r1, sp, #24
; CHECK-NEXT: add r2, sp, #20
; CHECK-NEXT: bl h
; Load `x`, `y`, and `z` via SP for passing to `g`
; CHECK: ldr r1, [sp, #28]
; CHECK-NEXT: ldr r2, [sp, #24]
; CHECK-NEXT: ldr r3, [sp, #20]
; CHECK: bl g
; VLAs, access via BP.
; int test_local_vla(int n) {
; int v[n];
; int x, y, z;
; h(&x, &y, &z);
; return g(v, x, y, z, 0, 0);
; }
; Local-variable access in the presence of a variable-length array: three
; fixed scalars plus an alloca whose element count is the runtime value %n.
; The expectations after this function look for x, y, z being addressed
; through r6 and a copy of it in r5.
define dso_local i32 @test_local_vla(i32 %n) local_unnamed_addr {
entry:
; Fixed-size scalars `x`, `y`, `z`.
%x = alloca i32, align 4
%y = alloca i32, align 4
%z = alloca i32, align 4
; `int v[n]` -- %n elements of i32, sized at run time.
%vla = alloca i32, i32 %n, align 4
; The results of these three casts are not used anywhere in the function.
%0 = bitcast i32* %x to i8*
%1 = bitcast i32* %y to i8*
%2 = bitcast i32* %z to i8*
; h(&x, &y, &z); the returned value is ignored.
%call = call i32 @h(i32* nonnull %x, i32* nonnull %y, i32* nonnull %z)
; Reload x, y, z after the call to h, which received their addresses.
%3 = load i32, i32* %x, align 4
%4 = load i32, i32* %y, align 4
%5 = load i32, i32* %z, align 4
; g(v, x, y, z, 0, 0)
%call1 = call i32 @g(i32* nonnull %vla, i32 %3, i32 %4, i32 %5, i32 0, i32 0)
ret i32 %call1
}
; CHECK-LABEL: test_local_vla
; Setup frame pointer
; CHECK: add r7, sp, #12
; Setup base pointer
; CHECK: mov r6, sp
; CHECK: mov r5, r6
; Arguments to `h` computed relative to BP
; CHECK: adds r0, r6, #7
; CHECK-NEXT: adds r0, #1
; CHECK-NEXT: adds r1, r6, #4
; CHECK-NEXT: mov r2, r6
; CHECK-NEXT: bl h
; Load `x`, `y`, `z` via BP (r5 should still have the value of r6 from the move
; above)
; CHECK: ldr r3, [r5]
; CHECK-NEXT: ldr r2, [r5, #4]
; CHECK-NEXT: ldr r1, [r5, #8]
; CHECK: bl g
; Moving SP, access via SP.
; int test_local_moving_sp(int n) {
; int v[4];
; int x, y, z;
; return u(v, &x, &y, s, s) + u(v, &y, &z, s, s);
; }
; Local-variable access when calls pass large byval aggregates: @u is called
; twice, each time with two byval copies of the global @s (%struct.S,
; 128 x i32) and with addresses of locals. The expectations after this
; function look for the stack pointer being lowered before the first call and
; restored before the second. The incoming argument %n is not used.
define dso_local i32 @test_local_moving_sp(i32 %n) local_unnamed_addr {
entry:
; Locals: array `v` and scalars `x`, `y`, `z`.
%v = alloca [4 x i32], align 4
%x = alloca i32, align 4
%y = alloca i32, align 4
%z = alloca i32, align 4
; The results of these four casts are not used anywhere in the function.
%0 = bitcast [4 x i32]* %v to i8*
%1 = bitcast i32* %x to i8*
%2 = bitcast i32* %y to i8*
%3 = bitcast i32* %z to i8*
; Pointer to v[0]; reused as the first argument of both calls.
%arraydecay = getelementptr inbounds [4 x i32], [4 x i32]* %v, i32 0, i32 0
; u(v, &x, &y, s, s)
%call = call i32 @u(i32* nonnull %arraydecay, i32* nonnull %x, i32* nonnull %y, %struct.S* byval nonnull align 4 @s, %struct.S* byval nonnull align 4 @s)
; u(v, &y, &z, s, s)
%call2 = call i32 @u(i32* nonnull %arraydecay, i32* nonnull %y, i32* nonnull %z, %struct.S* byval nonnull align 4 @s, %struct.S* byval nonnull align 4 @s)
; Sum of the two call results is the return value.
%add = add nsw i32 %call2, %call
ret i32 %add
}
; CHECK-LABEL: test_local_moving_sp
; Locals area
; CHECK: sub sp, #36
; Outgoing arguments
; CHECK: sub sp, #508
; CHECK-NEXT: sub sp, #508
; CHECK-NEXT: sub sp, #8
; Argument addresses computed relative to SP
; CHECK: add r4, sp, #1020
; CHECK-NEXT: adds r4, #24
; CHECK: add r1, sp, #1020
; CHECK-NEXT: adds r1, #20
; CHECK: add r5, sp, #1020
; CHECK-NEXT: adds r5, #16
; CHECK: bl u
; Stack restored before next call
; CHECK: add sp, #508
; CHECK-NEXT: add sp, #508
; CHECK-NEXT: add sp, #8
; CHECK: bl u