; This is a basic test of the alloca instruction. ; RUN: %if --need=target_X8632 --command %p2i --filetype=obj --disassemble \ ; RUN: --target x8632 -i %s --args -O2 -allow-externally-defined-symbols \ ; RUN: | %if --need=target_X8632 --command FileCheck %s ; RUN: %if --need=target_MIPS32 --need=allow_dump \ ; RUN: --command %p2i --filetype=asm --assemble --disassemble --target \ ; RUN: mips32 -i %s --args -O2 -allow-externally-defined-symbols \ ; RUN: | %if --need=target_MIPS32 --need=allow_dump \ ; RUN: --command FileCheck --check-prefix MIPS32 %s ; Test that a sequence of allocas with less than stack alignment get fused. define internal void @fused_small_align(i32 %arg) { entry: %a1 = alloca i8, i32 8, align 4 %a2 = alloca i8, i32 12, align 4 %a3 = alloca i8, i32 16, align 8 %p1 = bitcast i8* %a1 to i32* %p2 = bitcast i8* %a2 to i32* %p3 = bitcast i8* %a3 to i32* store i32 %arg, i32* %p1, align 1 store i32 %arg, i32* %p2, align 1 store i32 %arg, i32* %p3, align 1 ret void } ; CHECK-LABEL: fused_small_align ; CHECK-NEXT: sub esp,0x3c ; CHECK-NEXT: mov eax,DWORD PTR [esp+0x40] ; CHECK-NEXT: mov DWORD PTR [esp+0x10],eax ; CHECK-NEXT: mov DWORD PTR [esp+0x18],eax ; CHECK-NEXT: mov DWORD PTR [esp],eax ; CHECK-NEXT: add esp,0x3c ; MIPS32-LABEL: fused_small_align ; MIPS32: addiu sp,sp,{{.*}} ; MIPS32: move v0,a0 ; MIPS32: sw v0,{{.*}}(sp) ; MIPS32: move v0,a0 ; MIPS32: sw v0,{{.*}}(sp) ; MIPS32: sw a0,{{.*}}(sp) ; MIPS32: addiu sp,sp,{{.*}} ; Test that a sequence of allocas with greater than stack alignment get fused. define internal void @fused_large_align(i32 %arg) { entry: %a1 = alloca i8, i32 8, align 32 %a2 = alloca i8, i32 12, align 64 %a3 = alloca i8, i32 16, align 32 %p1 = bitcast i8* %a1 to i32* %p2 = bitcast i8* %a2 to i32* %p3 = bitcast i8* %a3 to i32* store i32 %arg, i32* %p1, align 1 store i32 %arg, i32* %p2, align 1 store i32 %arg, i32* %p3, align 1 ret void } ; CHECK-LABEL: fused_large_align ; CHECK-NEXT: push ebp ; CHECK-NEXT: mov ebp,esp ; CHECK-NEXT: sub esp,0xb8 ; CHECK-NEXT: and esp,0xffffffc0 ; CHECK-NEXT: mov eax,DWORD PTR [ebp+0x8] ; CHECK-NEXT: mov DWORD PTR [esp+0x40],eax ; CHECK-NEXT: mov DWORD PTR [esp],eax ; CHECK-NEXT: mov DWORD PTR [esp+0x60],eax ; CHECK-NEXT: mov esp,ebp ; CHECK-NEXT: pop ebp ; MIPS32-LABEL: fused_large_align ; MIPS32: addiu sp,sp,{{.*}} ; MIPS32: sw s8,{{.*}}(sp) ; MIPS32: move s8,sp ; MIPS32: move v0,a0 ; MIPS32: sw v0,{{.*}}(sp) ; MIPS32: move v0,a0 ; MIPS32: sw v0,{{.*}}(sp) ; MIPS32: sw a0,{{.*}}(sp) ; MIPS32: move sp,s8 ; MIPS32: lw s8,{{.*}}(sp) ; MIPS32: addiu sp,sp,{{.*}} ; Test that an interior pointer into a rematerializable variable is also ; rematerializable, and test that it is detected even when the use appears ; syntactically before the definition. Test that it is folded into mem ; operands, and also rematerializable through an lea instruction for direct use. define internal i32 @fused_derived(i32 %arg) { entry: %a1 = alloca i8, i32 128, align 4 %a2 = alloca i8, i32 128, align 4 %a3 = alloca i8, i32 128, align 4 br label %block2 block1: %a2_i32 = bitcast i8* %a2 to i32* store i32 %arg, i32* %a2_i32, align 1 store i32 %arg, i32* %derived, align 1 ret i32 %retval block2: ; The following are all rematerializable variables deriving from %a2. %p2 = ptrtoint i8* %a2 to i32 %d = add i32 %p2, 12 %retval = add i32 %p2, 1 %derived = inttoptr i32 %d to i32* br label %block1 } ; CHECK-LABEL: fused_derived ; CHECK-NEXT: sub esp,0x18c ; CHECK-NEXT: mov [[ARG:e..]],DWORD PTR [esp+0x190] ; CHECK-NEXT: jmp ; CHECK-NEXT: mov DWORD PTR [esp+0x80],[[ARG]] ; CHECK-NEXT: mov DWORD PTR [esp+0x8c],[[ARG]] ; CHECK-NEXT: lea eax,[esp+0x81] ; CHECK-NEXT: add esp,0x18c ; CHECK-NEXT: ret ; MIPS32-LABEL: fused_derived ; MIPS32: addiu sp,sp,{{.*}} ; MIPS32: b ; MIPS32: move v0,a0 ; MIPS32: sw v0,{{.*}}(sp) ; MIPS32: sw a0,{{.*}}(sp) ; MIPS32: addiu v0,sp,129 ; MIPS32: addiu sp,sp,{{.*}} ; Test that a fixed alloca gets referenced by the frame pointer. define internal void @fused_small_align_with_dynamic(i32 %arg) { entry: %a1 = alloca i8, i32 8, align 16 br label %next next: %a2 = alloca i8, i32 12, align 1 %a3 = alloca i8, i32 16, align 1 %p1 = bitcast i8* %a1 to i32* %p2 = bitcast i8* %a2 to i32* %p3 = bitcast i8* %a3 to i32* store i32 %arg, i32* %p1, align 1 store i32 %arg, i32* %p2, align 1 store i32 %arg, i32* %p3, align 1 ret void } ; CHECK-LABEL: fused_small_align_with_dynamic ; CHECK-NEXT: push ebp ; CHECK-NEXT: mov ebp,esp ; CHECK-NEXT: sub esp,0x18 ; CHECK-NEXT: mov eax,DWORD PTR [ebp+0x8] ; CHECK-NEXT: sub esp,0x10 ; CHECK-NEXT: mov ecx,esp ; CHECK-NEXT: sub esp,0x10 ; CHECK-NEXT: mov edx,esp ; CHECK-NEXT: mov DWORD PTR [ebp-0x18],eax ; CHECK-NEXT: mov DWORD PTR [ecx],eax ; CHECK-NEXT: mov DWORD PTR [edx],eax ; CHECK-NEXT: mov esp,ebp ; CHECK-NEXT: pop ebp ; MIPS32-LABEL: fused_small_align_with_dynamic ; MIPS32: addiu sp,sp,{{.*}} ; MIPS32: sw s8,{{.*}}(sp) ; MIPS32: move s8,sp ; MIPS32: addiu v0,sp,0 ; MIPS32: addiu v1,sp,16 ; MIPS32: move a1,a0 ; MIPS32: sw a1,32(s8) ; MIPS32: move a1,a0 ; MIPS32: sw a1,0(v0) ; MIPS32: sw a0,0(v1) ; MIPS32: move sp,s8 ; MIPS32: lw s8,{{.*}}(sp) ; MIPS32: addiu sp,sp,{{.*}} ; Test that a sequence with greater than stack alignment and dynamic size ; get folded and referenced correctly; define internal void @fused_large_align_with_dynamic(i32 %arg) { entry: %a1 = alloca i8, i32 8, align 32 %a2 = alloca i8, i32 12, align 32 %a3 = alloca i8, i32 16, align 1 %a4 = alloca i8, i32 16, align 1 br label %next next: %a5 = alloca i8, i32 16, align 1 %p1 = bitcast i8* %a1 to i32* %p2 = bitcast i8* %a2 to i32* %p3 = bitcast i8* %a3 to i32* %p4 = bitcast i8* %a4 to i32* %p5 = bitcast i8* %a5 to i32* store i32 %arg, i32* %p1, align 1 store i32 %arg, i32* %p2, align 1 store i32 %arg, i32* %p3, align 1 store i32 %arg, i32* %p4, align 1 store i32 %arg, i32* %p5, align 1 ret void } ; CHECK-LABEL: fused_large_align_with_dynamic ; CHECK-NEXT: push ebx ; CHECK-NEXT: push ebp ; CHECK-NEXT: mov ebp,esp ; CHECK-NEXT: sub esp,0x24 ; CHECK-NEXT: mov eax,DWORD PTR [ebp+0xc] ; CHECK-NEXT: and esp,0xffffffe0 ; CHECK-NEXT: sub esp,0x40 ; CHECK-NEXT: mov ecx,esp ; CHECK-NEXT: mov edx,ecx ; CHECK-NEXT: add ecx,0x20 ; CHECK-NEXT: add edx,0x0 ; CHECK-NEXT: sub esp,0x10 ; CHECK-NEXT: mov ebx,esp ; CHECK-NEXT: mov DWORD PTR [edx],eax ; CHECK-NEXT: mov DWORD PTR [ecx],eax ; CHECK-NEXT: mov DWORD PTR [ebp-0x14],eax ; CHECK-NEXT: mov DWORD PTR [ebp-0x24],eax ; CHECK-NEXT: mov DWORD PTR [ebx],eax ; CHECK-NEXT: mov esp,ebp ; CHECK-NEXT: pop ebp ; MIPS32-LABEL: fused_large_align_with_dynamic ; MIPS32: addiu sp,sp,{{.*}} ; MIPS32: sw s8,{{.*}}(sp) ; MIPS32: move s8,sp ; MIPS32: addiu v0,sp,0 ; MIPS32: addiu v1,sp,64 ; MIPS32: move a1,v0 ; MIPS32: move a2,a0 ; MIPS32: sw a2,0(a1) ; MIPS32: move a1,a0 ; MIPS32: sw a1,32(v0) ; MIPS32: move v0,a0 ; MIPS32: sw v0,80(s8) ; MIPS32: move v0,a0 ; MIPS32: sw v0,96(s8) ; MIPS32: sw a0,0(v1) ; MIPS32: move sp,s8 ; MIPS32: lw s8,{{.*}}(sp) ; MIPS32: addiu sp,sp,{{.*}}