185 lines
8.0 KiB
LLVM
185 lines
8.0 KiB
LLVM
|
; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu | FileCheck %s -check-prefix=X64
|
||
|
; RUN: llc < %s -mtriple=i686-unknown-linux-gnu | FileCheck %s -check-prefix=X32
|
||
|
|
||
|
; CHECK-LABEL: foo
|
||
|
|
||
|
; Check the functionality of the local stack symbol table ordering
|
||
|
; heuristics.
|
||
|
; The test has a bunch of locals of various sizes that are referenced a
|
||
|
; different number of times.
|
||
|
;
|
||
|
; a : 120B, 9 uses, density = 0.075
|
||
|
; aa : 4000B, 1 use, density = 0.00025
|
||
|
; b : 4B, 1 use, density = 0.25
|
||
|
; cc : 4000B, 2 uses, density = 0.0005
|
||
|
; d : 4B, 2 uses, density = 0.5
|
||
|
; e : 4B, 3 uses, density = 0.75
|
||
|
; f : 4B, 4 uses, density = 1
|
||
|
;
|
||
|
; Given the size, number of uses and calculated density (uses / size), we're
|
||
|
; going to hope that f gets allocated closest to the stack pointer,
|
||
|
; followed by e, d, b, then a (to check for just a few).
|
||
|
; We use gnu-inline asm between calls to prevent registerization of addresses
|
||
|
; so that we get exact counts.
|
||
|
;
|
||
|
; The test is taken from something like this:
|
||
|
; void foo()
|
||
|
; {
|
||
|
; int f; // 4 uses. 4 / 4 = 1
|
||
|
; int a[30]; // 9 uses. 9 / 120 = 0.075
|
||
|
; int aa[1000]; // 1 use. 1 / 4000 = 0.00025
|
||
|
; int e; // 3 uses. 3 / 4 = 0.75
|
||
|
; int cc[1000]; // 2 uses. 2 / 4000 = 0.0005
|
||
|
; int b; // 1 use. 1 / 4 = 0.25
|
||
|
; int d; // 2 uses. 2 / 4 = 0.5
|
||
|
; int aaa[1000]; // 2 uses. 2 / 4000 = 0.0005
|
||
|
;
|
||
|
;
|
||
|
; check_a(&a);
|
||
|
; bar1(&aaa);
|
||
|
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
|
||
|
; bar1(&a);
|
||
|
; check_f(&f);
|
||
|
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
|
||
|
; bar1(&a);
|
||
|
; bar3(&aa, &aaa, &cc);
|
||
|
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
|
||
|
; bar2(&a,&cc);
|
||
|
; check_b(&b);
|
||
|
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
|
||
|
; bar1(&a);
|
||
|
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
|
||
|
; bar2(&a, &f);
|
||
|
; check_e(&e);
|
||
|
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
|
||
|
; bar1(&a);
|
||
|
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
|
||
|
; bar2(&e, &f);
|
||
|
; check_d(&d);
|
||
|
; bar1(&a);
|
||
|
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
|
||
|
; bar3(&d, &e, &f);
|
||
|
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
|
||
|
; bar1(&a);
|
||
|
; }
|
||
|
;
|
||
|
; X64: leaq 16(%rsp), %rdi
|
||
|
; X64: callq check_a
|
||
|
; X64: callq bar1
|
||
|
; X64: callq bar1
|
||
|
; X64: movq %rsp, %rdi
|
||
|
; X64: callq check_f
|
||
|
; X64: callq bar1
|
||
|
; X64: callq bar3
|
||
|
; X64: callq bar2
|
||
|
; X64: leaq 12(%rsp), %rdi
|
||
|
; X64: callq check_b
|
||
|
; X64: callq bar1
|
||
|
; X64: callq bar2
|
||
|
; X64: leaq 4(%rsp), %rdi
|
||
|
; X64: callq check_e
|
||
|
; X64: callq bar1
|
||
|
; X64: callq bar2
|
||
|
; X64: leaq 8(%rsp), %rdi
|
||
|
; X64: callq check_d
|
||
|
|
||
|
; X32: leal 32(%esp)
|
||
|
; X32: calll check_a
|
||
|
; X32: calll bar1
|
||
|
; X32: calll bar1
|
||
|
; X32: leal 16(%esp)
|
||
|
; X32: calll check_f
|
||
|
; X32: calll bar1
|
||
|
; X32: calll bar3
|
||
|
; X32: calll bar2
|
||
|
; X32: leal 28(%esp)
|
||
|
; X32: calll check_b
|
||
|
; X32: calll bar1
|
||
|
; X32: calll bar2
|
||
|
; X32: leal 20(%esp)
|
||
|
; X32: calll check_e
|
||
|
; X32: calll bar1
|
||
|
; X32: calll bar2
|
||
|
; X32: leal 24(%esp)
|
||
|
; X32: calll check_d
|
||
|
|
||
|
|
||
|
; @foo is the fixture for the stack-ordering checks in this file. It allocates
; eight locals (%f, %a, %aa, %e, %cc, %b, %d, %aaa), passes the address of each
; one to external functions a different number of times, and returns void.
; The X64/X32 check lines match the address computed before each check_* call.
; NOTE(review): the matched offsets presumably depend on the order of the
; allocas and calls below -- confirm before reordering anything in this body.
define void @foo() nounwind uwtable {
|
||
|
entry:
|
||
|
; Locals under test: three 4000-byte arrays, one 120-byte array and four i32s.
%f = alloca i32, align 4
|
||
|
%a = alloca [30 x i32], align 16
|
||
|
%aa = alloca [1000 x i32], align 16
|
||
|
%e = alloca i32, align 4
|
||
|
%cc = alloca [1000 x i32], align 16
|
||
|
%b = alloca i32, align 4
|
||
|
%d = alloca i32, align 4
|
||
|
%aaa = alloca [1000 x i32], align 16
|
||
|
; Start the lifetime of every local. The intrinsic takes an i8*, hence one
; bitcast per local; %0..%7 are reused by the lifetime.end calls at the bottom.
%0 = bitcast i32* %f to i8*
|
||
|
call void @llvm.lifetime.start.p0i8(i64 4, i8* %0) #1
|
||
|
%1 = bitcast [30 x i32]* %a to i8*
|
||
|
call void @llvm.lifetime.start.p0i8(i64 120, i8* %1) #1
|
||
|
%2 = bitcast [1000 x i32]* %aa to i8*
|
||
|
call void @llvm.lifetime.start.p0i8(i64 4000, i8* %2) #1
|
||
|
%3 = bitcast i32* %e to i8*
|
||
|
call void @llvm.lifetime.start.p0i8(i64 4, i8* %3) #1
|
||
|
%4 = bitcast [1000 x i32]* %cc to i8*
|
||
|
call void @llvm.lifetime.start.p0i8(i64 4000, i8* %4) #1
|
||
|
%5 = bitcast i32* %b to i8*
|
||
|
call void @llvm.lifetime.start.p0i8(i64 4, i8* %5) #1
|
||
|
%6 = bitcast i32* %d to i8*
|
||
|
call void @llvm.lifetime.start.p0i8(i64 4, i8* %6) #1
|
||
|
%7 = bitcast [1000 x i32]* %aaa to i8*
|
||
|
call void @llvm.lifetime.start.p0i8(i64 4000, i8* %7) #1
|
||
|
; Address-taking calls. Every callee is declared as i32 (...), so each call
; site bitcasts it to the concrete variadic signature it is invoked with.
; All i32 results (%call..%call16) are unused.
%call = call i32 ([30 x i32]*, ...) bitcast (i32 (...)* @check_a to i32 ([30 x i32]*, ...)*)([30 x i32]* %a)
|
||
|
%call1 = call i32 ([1000 x i32]*, ...) bitcast (i32 (...)* @bar1 to i32 ([1000 x i32]*, ...)*)([1000 x i32]* %aaa)
|
||
|
; Empty inline asm: its only content is the clobber list. Per the header of
; this file it is placed between calls to prevent registerization of addresses.
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
|
||
|
%call2 = call i32 ([30 x i32]*, ...) bitcast (i32 (...)* @bar1 to i32 ([30 x i32]*, ...)*)([30 x i32]* %a)
|
||
|
%call3 = call i32 (i32*, ...) bitcast (i32 (...)* @check_f to i32 (i32*, ...)*)(i32* %f)
|
||
|
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
|
||
|
%call4 = call i32 ([30 x i32]*, ...) bitcast (i32 (...)* @bar1 to i32 ([30 x i32]*, ...)*)([30 x i32]* %a)
|
||
|
; The only use of %aa; also uses %aaa and %cc.
%call5 = call i32 ([1000 x i32]*, [1000 x i32]*, [1000 x i32]*, ...) bitcast (i32 (...)* @bar3 to i32 ([1000 x i32]*, [1000 x i32]*, [1000 x i32]*, ...)*)([1000 x i32]* %aa, [1000 x i32]* %aaa, [1000 x i32]* %cc)
|
||
|
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
|
||
|
%call6 = call i32 ([30 x i32]*, [1000 x i32]*, ...) bitcast (i32 (...)* @bar2 to i32 ([30 x i32]*, [1000 x i32]*, ...)*)([30 x i32]* %a, [1000 x i32]* %cc)
|
||
|
; The only use of %b.
%call7 = call i32 (i32*, ...) bitcast (i32 (...)* @check_b to i32 (i32*, ...)*)(i32* %b)
|
||
|
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
|
||
|
%call8 = call i32 ([30 x i32]*, ...) bitcast (i32 (...)* @bar1 to i32 ([30 x i32]*, ...)*)([30 x i32]* %a)
|
||
|
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
|
||
|
%call9 = call i32 ([30 x i32]*, i32*, ...) bitcast (i32 (...)* @bar2 to i32 ([30 x i32]*, i32*, ...)*)([30 x i32]* %a, i32* %f)
|
||
|
%call10 = call i32 (i32*, ...) bitcast (i32 (...)* @check_e to i32 (i32*, ...)*)(i32* %e)
|
||
|
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
|
||
|
%call11 = call i32 ([30 x i32]*, ...) bitcast (i32 (...)* @bar1 to i32 ([30 x i32]*, ...)*)([30 x i32]* %a)
|
||
|
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
|
||
|
%call12 = call i32 (i32*, i32*, ...) bitcast (i32 (...)* @bar2 to i32 (i32*, i32*, ...)*)(i32* %e, i32* %f)
|
||
|
; Unlike the other check_* calls, no inline asm separates this call from the
; bar1 call that follows it.
%call13 = call i32 (i32*, ...) bitcast (i32 (...)* @check_d to i32 (i32*, ...)*)(i32* %d)
|
||
|
%call14 = call i32 ([30 x i32]*, ...) bitcast (i32 (...)* @bar1 to i32 ([30 x i32]*, ...)*)([30 x i32]* %a)
|
||
|
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
|
||
|
%call15 = call i32 (i32*, i32*, i32*, ...) bitcast (i32 (...)* @bar3 to i32 (i32*, i32*, i32*, ...)*)(i32* %d, i32* %e, i32* %f)
|
||
|
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
|
||
|
%call16 = call i32 ([30 x i32]*, ...) bitcast (i32 (...)* @bar1 to i32 ([30 x i32]*, ...)*)([30 x i32]* %a)
|
||
|
; End the lifetimes in the reverse order of the lifetime.start calls
; (%7 down to %0).
call void @llvm.lifetime.end.p0i8(i64 4000, i8* %7) #1
|
||
|
call void @llvm.lifetime.end.p0i8(i64 4, i8* %6) #1
|
||
|
call void @llvm.lifetime.end.p0i8(i64 4, i8* %5) #1
|
||
|
call void @llvm.lifetime.end.p0i8(i64 4000, i8* %4) #1
|
||
|
call void @llvm.lifetime.end.p0i8(i64 4, i8* %3) #1
|
||
|
call void @llvm.lifetime.end.p0i8(i64 4000, i8* %2) #1
|
||
|
call void @llvm.lifetime.end.p0i8(i64 120, i8* %1) #1
|
||
|
call void @llvm.lifetime.end.p0i8(i64 4, i8* %0) #1
|
||
|
ret void
|
||
|
}
|
||
|
|
||
|
; Lifetime-start intrinsic, taking an i64 and an i8* (nocapture). @foo calls it
; once per local with 4, 120 or 4000 and the local's address cast to i8*.
; NOTE(review): attribute group #1 is not defined in the visible part of this
; file, so the "nounwind" annotation below cannot be confirmed from here.
; Function Attrs: nounwind
|
||
|
declare void @llvm.lifetime.start.p0i8(i64, i8* nocapture) #1
|
||
|
|
||
|
; External callees used by @foo. Each is declared as i32 (...) and is called
; through a bitcast to the concrete signature needed at the call site; the only
; arguments they receive are addresses of @foo's locals.
; check_a/check_f/check_b/check_e/check_d each receive a single local; the
; X64/X32 check lines match the address computed just before those calls.
; bar1/bar2/bar3 take one, two and three addresses respectively.
; NOTE(review): attribute group #2 is not defined in the visible part of this
; file -- confirm what it is expected to contain.
declare i32 @check_a(...) #2
|
||
|
declare i32 @bar1(...) #2
|
||
|
declare i32 @check_f(...) #2
|
||
|
declare i32 @bar3(...) #2
|
||
|
declare i32 @bar2(...) #2
|
||
|
declare i32 @check_b(...) #2
|
||
|
declare i32 @check_e(...) #2
|
||
|
declare i32 @check_d(...) #2
|
||
|
|
||
|
; Lifetime-end intrinsic, taking an i64 and an i8* (nocapture). @foo calls it
; once per local just before returning, with the same size/pointer pairs that
; were passed to the matching lifetime.start calls.
; NOTE(review): attribute group #1 is not defined in the visible part of this
; file, so the "nounwind" annotation below cannot be confirmed from here.
; Function Attrs: nounwind
|
||
|
declare void @llvm.lifetime.end.p0i8(i64, i8* nocapture) #1
|
||
|
|