1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
; RUN: llc < %s -mtriple=x86_64-unknown-linux-gnu | FileCheck %s -check-prefix=X64
; RUN: llc < %s -mtriple=i686-unknown-linux-gnu | FileCheck %s -check-prefix=X32
; CHECK-LABEL: foo
; Check the functionality of the local stack symbol table ordering
; heuristics.
; The test has a bunch of locals of various sizes that are referenced a
; different number of times.
;
; a : 120B, 9 uses, density = 0.075
; aa : 4000B, 1 use, density = 0.00025
; aaa : 4000B, 2 uses, density = 0.0005
; b : 4B, 1 use, density = 0.25
; cc : 4000B, 2 uses, density = 0.0005
; d : 4B, 2 uses, density = 0.5
; e : 4B, 3 uses, density = 0.75
; f : 4B, 4 uses, density = 1
;
; Given the size, number of uses and calculated density (uses / size), we're
; going to hope that f gets allocated closest to the stack pointer,
; followed by e, d, b, then a (to check for just a few).
; We use GNU inline asm between calls to keep the addresses from being held
; in registers, so that every use is counted exactly.
;
; The test is taken from something like this:
; void foo()
; {
; int f; // 4 uses. 4 / 4 = 1
; int a[30]; // 9 uses. 9 / 120 = 0.075
; int aa[1000]; // 1 use. 1 / 4000 = 0.00025
; int e; // 3 uses. 3 / 4 = 0.75
; int cc[1000]; // 2 uses. 2 / 4000 = 0.0005
; int b; // 1 use. 1 / 4 = 0.25
; int d; // 2 uses. 2 / 4 = 0.5
; int aaa[1000]; // 2 uses. 2 / 4000 = 0.0005
;
;
; check_a(&a);
; bar1(&aaa);
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
; bar1(&a);
; check_f(&f);
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
; bar1(&a);
; bar3(&aa, &aaa, &cc);
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
; bar2(&a,&cc);
; check_b(&b);
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
; bar1(&a);
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
; bar2(&a, &f);
; check_e(&e);
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
; bar1(&a);
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
; bar2(&e, &f);
; check_d(&d);
; bar1(&a);
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
; bar3(&d, &e, &f);
; asm ("":::"esi","edi","ebp","ebx","rbx","r12","r13","r14","r15","rbp");
; bar1(&a);
; }
;
; X64: leaq 16(%rsp), %rdi
; X64: callq check_a
; X64: callq bar1
; X64: callq bar1
; X64: movq %rsp, %rdi
; X64: callq check_f
; X64: callq bar1
; X64: callq bar3
; X64: callq bar2
; X64: leaq 12(%rsp), %rdi
; X64: callq check_b
; X64: callq bar1
; X64: callq bar2
; X64: leaq 4(%rsp), %rdi
; X64: callq check_e
; X64: callq bar1
; X64: callq bar2
; X64: leaq 8(%rsp), %rdi
; X64: callq check_d
; X32: leal 32(%esp)
; X32: calll check_a
; X32: calll bar1
; X32: calll bar1
; X32: leal 16(%esp)
; X32: calll check_f
; X32: calll bar1
; X32: calll bar3
; X32: calll bar2
; X32: leal 28(%esp)
; X32: calll check_b
; X32: calll bar1
; X32: calll bar2
; X32: leal 20(%esp)
; X32: calll check_e
; X32: calll bar1
; X32: calll bar2
; X32: leal 24(%esp)
; X32: calll check_d
; @foo is the function under test. It allocates eight locals, opens a lifetime
; for each of them, and then passes their addresses to external functions a
; different number of times per local:
;   a = 9, f = 4, e = 3, d = 2, cc = 2, aaa = 2, b = 1, aa = 1.
; The FileCheck lines in the file header inspect the stack offsets used for
; a, f, b, e and d at their respective check_* calls.
define void @foo() nounwind uwtable {
entry:
; Stack slots, in the same order as the C sketch in the file header:
; four i32 scalars (4 bytes each), one [30 x i32] array (120 bytes) and
; three [1000 x i32] arrays (4000 bytes each).
%f = alloca i32, align 4
%a = alloca [30 x i32], align 16
%aa = alloca [1000 x i32], align 16
%e = alloca i32, align 4
%cc = alloca [1000 x i32], align 16
%b = alloca i32, align 4
%d = alloca i32, align 4
%aaa = alloca [1000 x i32], align 16
; Cast every slot to i8* and mark the start of its lifetime; the i64 operand
; is the slot size in bytes. %0..%7 are reused by the lifetime.end calls at
; the bottom of the function.
%0 = bitcast i32* %f to i8*
call void @llvm.lifetime.start.p0i8(i64 4, i8* %0) #1
%1 = bitcast [30 x i32]* %a to i8*
call void @llvm.lifetime.start.p0i8(i64 120, i8* %1) #1
%2 = bitcast [1000 x i32]* %aa to i8*
call void @llvm.lifetime.start.p0i8(i64 4000, i8* %2) #1
%3 = bitcast i32* %e to i8*
call void @llvm.lifetime.start.p0i8(i64 4, i8* %3) #1
%4 = bitcast [1000 x i32]* %cc to i8*
call void @llvm.lifetime.start.p0i8(i64 4000, i8* %4) #1
%5 = bitcast i32* %b to i8*
call void @llvm.lifetime.start.p0i8(i64 4, i8* %5) #1
%6 = bitcast i32* %d to i8*
call void @llvm.lifetime.start.p0i8(i64 4, i8* %6) #1
%7 = bitcast [1000 x i32]* %aaa to i8*
call void @llvm.lifetime.start.p0i8(i64 4000, i8* %7) #1
; Each callee is declared as i32 (...), so every call bitcasts the callee to
; a varargs signature whose fixed parameters match the pointers being passed.
; The call order below mirrors the C sketch in the file header.
%call = call i32 ([30 x i32]*, ...) bitcast (i32 (...)* @check_a to i32 ([30 x i32]*, ...)*)([30 x i32]* %a)
%call1 = call i32 ([1000 x i32]*, ...) bitcast (i32 (...)* @bar1 to i32 ([1000 x i32]*, ...)*)([1000 x i32]* %aaa)
; Empty inline asm used only for its clobber list (esi, edi, ebp, ebx, rbx,
; r12-r15, rbp, plus dirflag/fpsr/flags). Per the file header, these barriers
; stop addresses from being kept in registers so the use counts stay exact.
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
%call2 = call i32 ([30 x i32]*, ...) bitcast (i32 (...)* @bar1 to i32 ([30 x i32]*, ...)*)([30 x i32]* %a)
%call3 = call i32 (i32*, ...) bitcast (i32 (...)* @check_f to i32 (i32*, ...)*)(i32* %f)
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
%call4 = call i32 ([30 x i32]*, ...) bitcast (i32 (...)* @bar1 to i32 ([30 x i32]*, ...)*)([30 x i32]* %a)
; The only use of aa, and the second use of aaa.
%call5 = call i32 ([1000 x i32]*, [1000 x i32]*, [1000 x i32]*, ...) bitcast (i32 (...)* @bar3 to i32 ([1000 x i32]*, [1000 x i32]*, [1000 x i32]*, ...)*)([1000 x i32]* %aa, [1000 x i32]* %aaa, [1000 x i32]* %cc)
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
%call6 = call i32 ([30 x i32]*, [1000 x i32]*, ...) bitcast (i32 (...)* @bar2 to i32 ([30 x i32]*, [1000 x i32]*, ...)*)([30 x i32]* %a, [1000 x i32]* %cc)
; The only use of b.
%call7 = call i32 (i32*, ...) bitcast (i32 (...)* @check_b to i32 (i32*, ...)*)(i32* %b)
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
%call8 = call i32 ([30 x i32]*, ...) bitcast (i32 (...)* @bar1 to i32 ([30 x i32]*, ...)*)([30 x i32]* %a)
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
%call9 = call i32 ([30 x i32]*, i32*, ...) bitcast (i32 (...)* @bar2 to i32 ([30 x i32]*, i32*, ...)*)([30 x i32]* %a, i32* %f)
%call10 = call i32 (i32*, ...) bitcast (i32 (...)* @check_e to i32 (i32*, ...)*)(i32* %e)
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
%call11 = call i32 ([30 x i32]*, ...) bitcast (i32 (...)* @bar1 to i32 ([30 x i32]*, ...)*)([30 x i32]* %a)
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
%call12 = call i32 (i32*, i32*, ...) bitcast (i32 (...)* @bar2 to i32 (i32*, i32*, ...)*)(i32* %e, i32* %f)
; Note: there is no asm barrier between check_d and the bar1 call that
; follows it, matching the C sketch in the file header.
%call13 = call i32 (i32*, ...) bitcast (i32 (...)* @check_d to i32 (i32*, ...)*)(i32* %d)
%call14 = call i32 ([30 x i32]*, ...) bitcast (i32 (...)* @bar1 to i32 ([30 x i32]*, ...)*)([30 x i32]* %a)
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
%call15 = call i32 (i32*, i32*, i32*, ...) bitcast (i32 (...)* @bar3 to i32 (i32*, i32*, i32*, ...)*)(i32* %d, i32* %e, i32* %f)
call void asm sideeffect "", "~{esi},~{edi},~{ebp},~{ebx},~{rbx},~{r12},~{r13},~{r14},~{r15},~{rbp},~{dirflag},~{fpsr},~{flags}"() #1
%call16 = call i32 ([30 x i32]*, ...) bitcast (i32 (...)* @bar1 to i32 ([30 x i32]*, ...)*)([30 x i32]* %a)
; End every lifetime in the reverse of the order in which it was started
; (aaa first, f last).
call void @llvm.lifetime.end.p0i8(i64 4000, i8* %7) #1
call void @llvm.lifetime.end.p0i8(i64 4, i8* %6) #1
call void @llvm.lifetime.end.p0i8(i64 4, i8* %5) #1
call void @llvm.lifetime.end.p0i8(i64 4000, i8* %4) #1
call void @llvm.lifetime.end.p0i8(i64 4, i8* %3) #1
call void @llvm.lifetime.end.p0i8(i64 4000, i8* %2) #1
call void @llvm.lifetime.end.p0i8(i64 120, i8* %1) #1
call void @llvm.lifetime.end.p0i8(i64 4, i8* %0) #1
ret void
}
; External declarations used by @foo.
; NOTE(review): attribute groups #1 and #2 are referenced here and in @foo,
; but no "attributes #N = { ... }" definition is visible in this part of the
; file - confirm whether they are defined elsewhere or were stripped.
;
; Lifetime-start intrinsic; @foo calls it with the slot size in bytes and an
; i8* to the alloca.
; Function Attrs: nounwind
declare void @llvm.lifetime.start.p0i8(i64, i8* nocapture) #1
; Callees that receive the addresses of the locals. All are declared with an
; unprototyped varargs signature, i32 (...), and are bitcast to a concrete
; signature at each call site in @foo. The check_* functions are the calls
; whose address operand the FileCheck lines in the header inspect; bar1, bar2
; and bar3 take one, two and three pointers respectively at their call sites.
declare i32 @check_a(...) #2
declare i32 @bar1(...) #2
declare i32 @check_f(...) #2
declare i32 @bar3(...) #2
declare i32 @bar2(...) #2
declare i32 @check_b(...) #2
declare i32 @check_e(...) #2
declare i32 @check_d(...) #2
; Lifetime-end intrinsic; @foo calls it with the same size and i8* operands
; that were passed to the matching lifetime.start.
; Function Attrs: nounwind
declare void @llvm.lifetime.end.p0i8(i64, i8* nocapture) #1
|