1 ;; Test for memprof metadata propagation, ensuring metadata is moved to the inlined callsites.
3 ;; Also check that callsite metadata was updated with inlined stack ids.
5 ;; The following code was used to generate the following IR and its memprof profile:
10 ;; #include <unistd.h>
12 ;; return new char[10];
14 ;; char *foo2() __attribute((noinline)) {
23 ;; int main(int argc, char **argv) {
40 ; RUN: opt -passes=inline %s -S | FileCheck %s
42 ; ModuleID = 'memprof_inline2.cc'
;; Module-level header: records the originating source file name and pins the
;; data layout and target triple (x86_64 Linux) used by this test.
43 source_filename = "memprof_inline2.cc"
44 target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
45 target triple = "x86_64-unknown-linux-gnu"
47 ; Function Attrs: mustprogress uwtable
;; foo: returns the pointer produced by a single call to @_Znam with size 10.
;; That call is the only instruction in this file carrying !memprof metadata
;; (!43); it also carries the allocation's own !callsite id (!52). foo is not
;; marked noinline (attribute group #0), so it can be inlined into callers
;; whose call sites allow it.
48 ; CHECK-LABEL: define dso_local noundef ptr @_Z3foov
49 define dso_local noundef ptr @_Z3foov() #0 !dbg !39 {
51 ;; We should keep the original memprof metadata intact.
52 ; CHECK: call {{.*}} @_Znam{{.*}} !memprof ![[ORIGMEMPROF:[0-9]+]]
53 %call = call noalias noundef nonnull ptr @_Znam(i64 noundef 10) #7, !dbg !42, !memprof !43, !callsite !52
54 ret ptr %call, !dbg !53
57 ; Function Attrs: nobuiltin allocsize(0)
;; External declaration of the allocation routine called from foo
;; (presumably the mangled C++ operator new[] -- see the "new char[10]"
;; fragment in the file header).
58 declare noundef nonnull ptr @_Znam(i64 noundef) #1
60 ;; Mark noinline so we don't inline into calls from bar and baz. We should end
61 ;; up with a memprof metadata on the call to foo below.
62 ; Function Attrs: mustprogress noinline uwtable
63 ; CHECK-LABEL: define dso_local noundef ptr @_Z4foo2v
64 define dso_local noundef ptr @_Z4foo2v() #2 !dbg !54 {
66 ;; We should have memprof metadata for the call stacks from bar and baz,
67 ;; and the callsite metadata should be the concatenation of the id from the
68 ;; inlined call to new and the original callsite.
69 ; CHECK: call {{.*}} @_Znam{{.*}} !memprof ![[NEWMEMPROF:[0-9]+]], !callsite ![[NEWCALLSITE:[0-9]+]]
;; The only call in foo2. Its !callsite id (!56) is the second frame of the
;; two three-frame contexts (!49 and !51) listed in foo's memprof metadata.
70 %call = call noundef ptr @_Z3foov(), !dbg !55, !callsite !56
71 ret ptr %call, !dbg !57
74 ; Function Attrs: mustprogress uwtable
;; bar: forwards the result of foo2. The !callsite id on the call (!60) is the
;; last frame of context !51, which is tagged "cold" by MIB !50.
75 define dso_local noundef ptr @_Z3barv() #0 !dbg !58 {
77 %call = call noundef ptr @_Z4foo2v(), !dbg !59, !callsite !60
78 ret ptr %call, !dbg !61
81 ; Function Attrs: mustprogress uwtable
;; baz: forwards the result of foo2. The !callsite id on the call (!64) is the
;; last frame of context !49, which is tagged "notcold" by MIB !48.
82 define dso_local noundef ptr @_Z3bazv() #0 !dbg !62 {
84 %call = call noundef ptr @_Z4foo2v(), !dbg !63, !callsite !64
85 ret ptr %call, !dbg !65
88 ;; Make sure we don't propagate any memprof/callsite metadata
89 ; Function Attrs: mustprogress uwtable
90 ; CHECK-LABEL: define dso_local noundef ptr @notprofiled
91 define dso_local noundef ptr @notprofiled() #0 !dbg !66 {
;; The call to foo below carries no !callsite metadata, i.e. it is not part of
;; any profiled context. Once foo is inlined here, the inlined call to new
;; must therefore carry neither !memprof nor !callsite metadata.
93 ; CHECK: call {{.*}} @_Znam
; CHECK-NOT: !memprof
95 ; CHECK-NOT: !callsite
96 %call = call noundef ptr @_Z3foov(), !dbg !67
;; Anchor on the ret that immediately follows the inlined call. Without a
;; positive match here the two negative checks above would extend past the end
;; of this function and trip over the !callsite metadata on the calls in main.
; CHECK-NEXT: ret
98 ret ptr %call, !dbg !68
101 ; Function Attrs: mustprogress noinline norecurse optnone uwtable
;; main: driver for the profiled contexts. It is optnone/noinline (attribute
;; group #3) and calls foo twice, then bar and baz once each, storing the four
;; returned pointers in %c, %d, %e and %f. Each buffer is then memset (10
;; bytes of zero) and finally passed to @_ZdaPv behind a null check, with a
;; call to sleep(200) after the first delete.
102 define dso_local noundef i32 @main(i32 noundef %argc, ptr noundef %argv) #3 !dbg !69 {
104 %retval = alloca i32, align 4
105 %argc.addr = alloca i32, align 4
106 %argv.addr = alloca ptr, align 8
107 %c = alloca ptr, align 8
108 %d = alloca ptr, align 8
109 %e = alloca ptr, align 8
110 %f = alloca ptr, align 8
111 store i32 0, ptr %retval, align 4
112 store i32 %argc, ptr %argc.addr, align 4
113 store ptr %argv, ptr %argv.addr, align 8
114 ;; The below 4 callsites are all annotated as noinline
;; (attribute group #8), so none of foo, bar or baz is inlined into main. The
;; ids on the two direct calls to foo (!71, !74) are the last frames of the
;; two-frame contexts !47 ("notcold") and !45 ("cold") respectively.
115 %call = call noundef ptr @_Z3foov() #8, !dbg !70, !callsite !71
116 store ptr %call, ptr %c, align 8, !dbg !72
117 %call1 = call noundef ptr @_Z3foov() #8, !dbg !73, !callsite !74
118 store ptr %call1, ptr %d, align 8, !dbg !75
119 %call2 = call noundef ptr @_Z3barv() #8, !dbg !76, !callsite !77
120 store ptr %call2, ptr %e, align 8, !dbg !78
121 %call3 = call noundef ptr @_Z3bazv() #8, !dbg !79, !callsite !80
122 store ptr %call3, ptr %f, align 8, !dbg !81
;; Zero-fill the 10 bytes of each of the four allocations.
123 %0 = load ptr, ptr %c, align 8, !dbg !82
124 call void @llvm.memset.p0.i64(ptr align 1 %0, i8 0, i64 10, i1 false), !dbg !83
125 %1 = load ptr, ptr %d, align 8, !dbg !84
126 call void @llvm.memset.p0.i64(ptr align 1 %1, i8 0, i64 10, i1 false), !dbg !85
127 %2 = load ptr, ptr %e, align 8, !dbg !86
128 call void @llvm.memset.p0.i64(ptr align 1 %2, i8 0, i64 10, i1 false), !dbg !87
129 %3 = load ptr, ptr %f, align 8, !dbg !88
130 call void @llvm.memset.p0.i64(ptr align 1 %3, i8 0, i64 10, i1 false), !dbg !89
;; Delete %c; the call to @_ZdaPv is skipped when the pointer is null.
131 %4 = load ptr, ptr %c, align 8, !dbg !90
132 %isnull = icmp eq ptr %4, null, !dbg !91
133 br i1 %isnull, label %delete.end, label %delete.notnull, !dbg !91
135 delete.notnull: ; preds = %entry
136 call void @_ZdaPv(ptr noundef %4) #9, !dbg !92
137 br label %delete.end, !dbg !92
139 delete.end: ; preds = %delete.notnull, %entry
;; sleep(200) sits between the delete of %c and the deletes of %d, %e and %f.
140 %call4 = call i32 @sleep(i32 noundef 200), !dbg !94
141 %5 = load ptr, ptr %d, align 8, !dbg !95
142 %isnull5 = icmp eq ptr %5, null, !dbg !96
143 br i1 %isnull5, label %delete.end7, label %delete.notnull6, !dbg !96
145 delete.notnull6: ; preds = %delete.end
146 call void @_ZdaPv(ptr noundef %5) #9, !dbg !97
147 br label %delete.end7, !dbg !97
149 delete.end7: ; preds = %delete.notnull6, %delete.end
150 %6 = load ptr, ptr %e, align 8, !dbg !98
151 %isnull8 = icmp eq ptr %6, null, !dbg !99
152 br i1 %isnull8, label %delete.end10, label %delete.notnull9, !dbg !99
154 delete.notnull9: ; preds = %delete.end7
155 call void @_ZdaPv(ptr noundef %6) #9, !dbg !100
156 br label %delete.end10, !dbg !100
158 delete.end10: ; preds = %delete.notnull9, %delete.end7
159 %7 = load ptr, ptr %f, align 8, !dbg !101
160 %isnull11 = icmp eq ptr %7, null, !dbg !102
161 br i1 %isnull11, label %delete.end13, label %delete.notnull12, !dbg !102
163 delete.notnull12: ; preds = %delete.end10
164 call void @_ZdaPv(ptr noundef %7) #9, !dbg !103
165 br label %delete.end13, !dbg !103
167 delete.end13: ; preds = %delete.notnull12, %delete.end10
171 ; Function Attrs: argmemonly nofree nounwind willreturn writeonly
;; External routines used only by main: the memset intrinsic, @_ZdaPv (the
;; routine main calls to release each buffer) and sleep.
172 declare void @llvm.memset.p0.i64(ptr nocapture writeonly, i8, i64, i1 immarg) #4
174 ; Function Attrs: nobuiltin nounwind
175 declare void @_ZdaPv(ptr noundef) #5
177 declare i32 @sleep(i32 noundef) #6
179 attributes #0 = { mustprogress uwtable "disable-tail-calls"="true" "frame-pointer"="all" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" }
;; Attribute groups referenced in this file:
;;   #0 - foo, bar, baz, notprofiled (inlinable definitions)
;;   #1 - declaration of @_Znam
;;   #2 - foo2 (adds noinline)
;;   #3 - main (noinline + optnone)
;;   #4 - memset intrinsic, #5 - @_ZdaPv, #6 - sleep
;;   #7 - call-site attributes on the call to @_Znam in foo
;;   #8 - call-site noinline on the four calls in main
;;   #9 - call-site attributes on the calls to @_ZdaPv
180 attributes #1 = { nobuiltin allocsize(0) "disable-tail-calls"="true" "frame-pointer"="all" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" }
181 attributes #2 = { mustprogress noinline uwtable "disable-tail-calls"="true" "frame-pointer"="all" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" }
182 attributes #3 = { mustprogress noinline norecurse optnone uwtable "disable-tail-calls"="true" "frame-pointer"="all" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" }
183 attributes #4 = { argmemonly nofree nounwind willreturn writeonly }
184 attributes #5 = { nobuiltin nounwind "disable-tail-calls"="true" "frame-pointer"="all" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" }
185 attributes #6 = { "disable-tail-calls"="true" "frame-pointer"="all" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" }
186 attributes #7 = { builtin allocsize(0) }
187 attributes #8 = { noinline }
188 attributes #9 = { builtin nounwind }
191 !llvm.module.flags = !{!2, !3, !4, !5, !6, !7, !8, !9}
;; !0/!1: compile unit and source file description (line-tables-only debug
;; info).
194 !0 = distinct !DICompileUnit(language: DW_LANG_C_plus_plus_14, file: !1, producer: "clang version 15.0.0 (https://github.com/llvm/llvm-project.git e09c924f98ec157adeaa74819b0aec9a07a1b552)", isOptimized: false, runtimeVersion: 0, emissionKind: LineTablesOnly, splitDebugInlining: false, debugInfoForProfiling: true, nameTableKind: None)
195 !1 = !DIFile(filename: "memprof_inline.cc", directory: "/usr/local/google/home/tejohnson/llvm/tmp", checksumkind: CSK_MD5, checksum: "8711f6fd269e6cb5611fef48bc906eab")
;; !2-!9: the module flags listed in !llvm.module.flags above.
196 !2 = !{i32 7, !"Dwarf Version", i32 5}
197 !3 = !{i32 2, !"Debug Info Version", i32 3}
198 !4 = !{i32 1, !"wchar_size", i32 4}
199 !5 = !{i32 7, !"PIC Level", i32 2}
200 !6 = !{i32 7, !"PIE Level", i32 2}
201 !7 = !{i32 7, !"uwtable", i32 2}
202 !8 = !{i32 7, !"frame-pointer", i32 2}
;; !9-!37: ProfileSummary module flag. The format is InstrProf and every count
;; recorded in it, including each detailed-summary entry, is zero.
203 !9 = !{i32 1, !"ProfileSummary", !10}
204 !10 = !{!11, !12, !13, !14, !15, !16, !17, !18, !19, !20}
205 !11 = !{!"ProfileFormat", !"InstrProf"}
206 !12 = !{!"TotalCount", i64 0}
207 !13 = !{!"MaxCount", i64 0}
208 !14 = !{!"MaxInternalCount", i64 0}
209 !15 = !{!"MaxFunctionCount", i64 0}
210 !16 = !{!"NumCounts", i64 0}
211 !17 = !{!"NumFunctions", i64 0}
212 !18 = !{!"IsPartialProfile", i64 0}
213 !19 = !{!"PartialProfileRatio", double 0.000000e+00}
214 !20 = !{!"DetailedSummary", !21}
215 !21 = !{!22, !23, !24, !25, !26, !27, !28, !29, !30, !31, !32, !33, !34, !35, !36, !37}
216 !22 = !{i32 10000, i64 0, i32 0}
217 !23 = !{i32 100000, i64 0, i32 0}
218 !24 = !{i32 200000, i64 0, i32 0}
219 !25 = !{i32 300000, i64 0, i32 0}
220 !26 = !{i32 400000, i64 0, i32 0}
221 !27 = !{i32 500000, i64 0, i32 0}
222 !28 = !{i32 600000, i64 0, i32 0}
223 !29 = !{i32 700000, i64 0, i32 0}
224 !30 = !{i32 800000, i64 0, i32 0}
225 !31 = !{i32 900000, i64 0, i32 0}
226 !32 = !{i32 950000, i64 0, i32 0}
227 !33 = !{i32 990000, i64 0, i32 0}
228 !34 = !{i32 999000, i64 0, i32 0}
229 !35 = !{i32 999900, i64 0, i32 0}
230 !36 = !{i32 999990, i64 0, i32 0}
231 !37 = !{i32 999999, i64 0, i32 0}
232 !38 = !{!"clang version 15.0.0 (https://github.com/llvm/llvm-project.git e09c924f98ec157adeaa74819b0aec9a07a1b552)"}
;; !39-!42: debug info for foo (@_Z3foov); !42 is the location of its call to
;; @_Znam.
233 !39 = distinct !DISubprogram(name: "foo", linkageName: "_Z3foov", scope: !1, file: !1, line: 4, type: !40, scopeLine: 4, flags: DIFlagPrototyped, spFlags: DISPFlagDefinition, unit: !0, retainedNodes: !41)
234 !40 = !DISubroutineType(types: !41)
236 !42 = !DILocation(line: 5, column: 10, scope: !39)
237 ;; The first 2 are from the direct calls to foo from main. Those stay on the
238 ;; callsite in foo, which isn't inlined into main due to the callsites in main
239 ;; being annotated as noinline.
240 ;; The second 2 are from the calls from foo2, which inlines its callsite to foo
241 ;; but is not itself inlined into its callers. Therefore they get moved to a
242 ;; new memprof metadata within foo2.
;; Layout: !43 is the list of MIB nodes attached to the allocation in foo.
;; Each MIB pairs a call stack (a list of i64 frame ids starting at the
;; allocation's own id, !52) with an allocation type string.
243 !43 = !{!44, !46, !48, !50}
244 !44 = !{!45, !"cold"}
245 !45 = !{i64 -2458008693472584243, i64 7394638144382192936}
246 !46 = !{!47, !"notcold"}
247 !47 = !{i64 -2458008693472584243, i64 -8908997186479157179}
248 !48 = !{!49, !"notcold"}
249 !49 = !{i64 -2458008693472584243, i64 -8079659623765193173, i64 -4805294506621015872}
250 !50 = !{!51, !"cold"}
251 !51 = !{i64 -2458008693472584243, i64 -8079659623765193173, i64 -972865200055133905}
252 ; CHECK: ![[ORIGMEMPROF]] = !{![[ORIGMIB1:[0-9]+]], ![[ORIGMIB2:[0-9]+]], ![[ORIGMIB3:[0-9]+]], ![[ORIGMIB4:[0-9]+]]}
253 ; CHECK: ![[ORIGMIB1]] = !{![[ORIGMIBSTACK1:[0-9]+]], !"cold"}
254 ; CHECK: ![[ORIGMIBSTACK1]] = !{i64 -2458008693472584243, i64 7394638144382192936}
255 ; CHECK: ![[ORIGMIB2]] = !{![[ORIGMIBSTACK2:[0-9]+]], !"notcold"}
256 ; CHECK: ![[ORIGMIBSTACK2]] = !{i64 -2458008693472584243, i64 -8908997186479157179}
257 ; CHECK: ![[ORIGMIB3]] = !{![[ORIGMIBSTACK3:[0-9]+]], !"notcold"}
258 ; CHECK: ![[ORIGMIBSTACK3]] = !{i64 -2458008693472584243, i64 -8079659623765193173, i64 -4805294506621015872}
259 ; CHECK: ![[ORIGMIB4]] = !{![[ORIGMIBSTACK4:[0-9]+]], !"cold"}
260 ; CHECK: ![[ORIGMIBSTACK4]] = !{i64 -2458008693472584243, i64 -8079659623765193173, i64 -972865200055133905}
;; The list attached in foo2 must consist of exactly the third and fourth MIB
;; nodes matched above. The captured names are used here rather than defined
;; again, because a fresh definition would accept any two metadata ids and
;; verify nothing about which contexts were moved.
261 ; CHECK: ![[NEWMEMPROF]] = !{![[ORIGMIB3]], ![[ORIGMIB4]]}
262 ; CHECK: ![[NEWCALLSITE]] = !{i64 -2458008693472584243, i64 -8079659623765193173}
263 !52 = !{i64 -2458008693472584243}
;; !52 above is the !callsite id of the allocation call in foo; it is the
;; first frame of every call stack in the memprof metadata.
264 !53 = !DILocation(line: 5, column: 3, scope: !39)
;; foo2: debug info plus the !callsite id (!56) of its call to foo.
265 !54 = distinct !DISubprogram(name: "foo2", linkageName: "_Z4foo2v", scope: !1, file: !1, line: 7, type: !40, scopeLine: 7, flags: DIFlagPrototyped, spFlags: DISPFlagDefinition, unit: !0, retainedNodes: !41)
266 !55 = !DILocation(line: 8, column: 10, scope: !54)
267 !56 = !{i64 -8079659623765193173}
268 !57 = !DILocation(line: 8, column: 3, scope: !54)
;; bar: debug info plus the !callsite id (!60) of its call to foo2.
269 !58 = distinct !DISubprogram(name: "bar", linkageName: "_Z3barv", scope: !1, file: !1, line: 10, type: !40, scopeLine: 10, flags: DIFlagPrototyped, spFlags: DISPFlagDefinition, unit: !0, retainedNodes: !41)
270 !59 = !DILocation(line: 11, column: 10, scope: !58)
271 !60 = !{i64 -972865200055133905}
272 !61 = !DILocation(line: 11, column: 3, scope: !58)
;; baz: debug info plus the !callsite id (!64) of its call to foo2.
273 !62 = distinct !DISubprogram(name: "baz", linkageName: "_Z3bazv", scope: !1, file: !1, line: 13, type: !40, scopeLine: 13, flags: DIFlagPrototyped, spFlags: DISPFlagDefinition, unit: !0, retainedNodes: !41)
274 !63 = !DILocation(line: 14, column: 10, scope: !62)
275 !64 = !{i64 -4805294506621015872}
276 !65 = !DILocation(line: 14, column: 3, scope: !62)
;; notprofiled: debug info only; its call to foo has no !callsite id.
277 !66 = distinct !DISubprogram(name: "notprofiled", linkageName: "notprofiled", scope: !1, file: !1, line: 400, type: !40, scopeLine: 400, flags: DIFlagPrototyped, spFlags: DISPFlagDefinition, unit: !0, retainedNodes: !41)
278 !67 = !DILocation(line: 401, column: 10, scope: !66)
279 !68 = !DILocation(line: 401, column: 3, scope: !66)
;; main: debug locations and the !callsite ids of its four calls. !71 and !74
;; (the calls to foo) are the last frames of contexts !47 and !45. !77 and !80
;; (the calls to bar and baz) do not appear in any memprof call stack in this
;; file.
280 !69 = distinct !DISubprogram(name: "main", scope: !1, file: !1, line: 16, type: !40, scopeLine: 16, flags: DIFlagPrototyped, spFlags: DISPFlagDefinition, unit: !0, retainedNodes: !41)
281 !70 = !DILocation(line: 17, column: 13, scope: !69)
282 !71 = !{i64 -8908997186479157179}
283 !72 = !DILocation(line: 17, column: 9, scope: !69)
284 !73 = !DILocation(line: 18, column: 13, scope: !69)
285 !74 = !{i64 7394638144382192936}
286 !75 = !DILocation(line: 18, column: 9, scope: !69)
287 !76 = !DILocation(line: 19, column: 13, scope: !69)
288 !77 = !{i64 -5510257407004945023}
289 !78 = !DILocation(line: 19, column: 9, scope: !69)
290 !79 = !DILocation(line: 20, column: 13, scope: !69)
291 !80 = !{i64 8771588133652501463}
292 !81 = !DILocation(line: 20, column: 9, scope: !69)
293 !82 = !DILocation(line: 21, column: 10, scope: !69)
294 !83 = !DILocation(line: 21, column: 3, scope: !69)
295 !84 = !DILocation(line: 22, column: 10, scope: !69)
296 !85 = !DILocation(line: 22, column: 3, scope: !69)
297 !86 = !DILocation(line: 23, column: 10, scope: !69)
298 !87 = !DILocation(line: 23, column: 3, scope: !69)
299 !88 = !DILocation(line: 24, column: 10, scope: !69)
300 !89 = !DILocation(line: 24, column: 3, scope: !69)
301 !90 = !DILocation(line: 25, column: 12, scope: !69)
302 !91 = !DILocation(line: 25, column: 3, scope: !69)
303 !92 = !DILocation(line: 25, column: 3, scope: !93)
304 !93 = !DILexicalBlockFile(scope: !69, file: !1, discriminator: 2)
305 !94 = !DILocation(line: 26, column: 3, scope: !69)
306 !95 = !DILocation(line: 27, column: 12, scope: !69)
307 !96 = !DILocation(line: 27, column: 3, scope: !69)
308 !97 = !DILocation(line: 27, column: 3, scope: !93)
309 !98 = !DILocation(line: 28, column: 12, scope: !69)
310 !99 = !DILocation(line: 28, column: 3, scope: !69)
311 !100 = !DILocation(line: 28, column: 3, scope: !93)
312 !101 = !DILocation(line: 29, column: 12, scope: !69)
313 !102 = !DILocation(line: 29, column: 3, scope: !69)
314 !103 = !DILocation(line: 29, column: 3, scope: !93)
315 !104 = !DILocation(line: 30, column: 3, scope: !69)