1 ; REQUIRES: x86_64-linux
2 ; RUN: opt < %s -passes=sample-profile -sample-profile-file=%S/Inputs/pseudo-probe-profile-mismatch.prof -report-profile-staleness -persist-profile-staleness -S 2>%t -o %t.ll
3 ; RUN: FileCheck %s --input-file %t
4 ; RUN: FileCheck %s --input-file %t.ll -check-prefix=CHECK-MD
5 ; RUN: llc < %t.ll -filetype=obj -o %t.obj
6 ; RUN: llvm-objdump --section-headers %t.obj | FileCheck %s --check-prefix=CHECK-OBJ
7 ; RUN: llc < %t.ll -filetype=asm -o - | FileCheck %s --check-prefix=CHECK-ASM
9 ; RUN: opt < %s -passes=sample-profile -sample-profile-file=%S/Inputs/pseudo-probe-profile-mismatch-nested.prof -report-profile-staleness -persist-profile-staleness -S 2>&1 | FileCheck %s --check-prefix=CHECK-NESTED
12 ; CHECK: (1/3) of functions' profile are invalid and (10/50) of samples are discarded due to function hash mismatch.
13 ; CHECK: (2/3) of callsites' profile are invalid and (20/30) of samples are discarded due to callsite location mismatch.
15 ; CHECK-MD: ![[#]] = !{!"NumMismatchedFuncHash", i64 1, !"TotalProfiledFunc", i64 3, !"MismatchedFuncHashSamples", i64 10, !"TotalFuncHashSamples", i64 50, !"NumMismatchedCallsites", i64 2, !"TotalProfiledCallsites", i64 3, !"MismatchedCallsiteSamples", i64 20, !"TotalCallsiteSamples", i64 30}
17 ; CHECK-OBJ: .llvm_stats
19 ; CHECK-ASM: .section .llvm_stats,"",@progbits
21 ; CHECK-ASM: .ascii "NumMismatchedFuncHash"
23 ; CHECK-ASM: .ascii "MQ=="
25 ; CHECK-ASM: .ascii "TotalProfiledFunc"
27 ; CHECK-ASM: .ascii "Mw=="
29 ; CHECK-ASM: .ascii "MismatchedFuncHashSamples"
31 ; CHECK-ASM: .ascii "MTA="
33 ; CHECK-ASM: .ascii "TotalFuncHashSamples"
35 ; CHECK-ASM: .ascii "NTA="
37 ; CHECK-ASM: .ascii "NumMismatchedCallsites"
39 ; CHECK-ASM: .ascii "Mg=="
41 ; CHECK-ASM: .ascii "TotalProfiledCallsites"
43 ; CHECK-ASM: .ascii "Mw=="
45 ; CHECK-ASM: .ascii "MismatchedCallsiteSamples"
47 ; CHECK-ASM: .ascii "MjA="
49 ; CHECK-ASM: .ascii "TotalCallsiteSamples"
51 ; CHECK-ASM: .ascii "MzA="
53 ; CHECK-NESTED: (1/2) of functions' profile are invalid and (211/311) of samples are discarded due to function hash mismatch.
; Target configuration for the module: x86_64 Linux ELF.
56 target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
57 target triple = "x86_64-unknown-linux-gnu"
; @x: zero-initialized i32 global. main() reads and writes it with volatile
; loads/stores around every call, and its debug type (!5) is a volatile int.
59 @x = dso_local global i32 0, align 4, !dbg !0
61 ; Function Attrs: nounwind uwtable
; foo(x): stores x + 1 into the stack slot %y with a volatile store, reloads
; it with a volatile load, and returns the reloaded value plus 1.
; The single llvm.pseudoprobe call (index 1) uses the same i64 identifier as
; the "foo" entry in !llvm.pseudo_probe_desc.
62 define dso_local i32 @foo(i32 noundef %x) #0 !dbg !16 {
64 %y = alloca i32, align 4
65 call void @llvm.dbg.value(metadata i32 %x, metadata !20, metadata !DIExpression()), !dbg !22
66 call void @llvm.lifetime.start.p0(i64 4, ptr nonnull %y), !dbg !23
67 call void @llvm.dbg.declare(metadata ptr %y, metadata !21, metadata !DIExpression()), !dbg !24
68 call void @llvm.pseudoprobe(i64 6699318081062747564, i64 1, i32 0, i64 -1), !dbg !25
69 %add = add nsw i32 %x, 1, !dbg !26
; Volatile store/load pair on %y: the value round-trips through memory.
70 store volatile i32 %add, ptr %y, align 4, !dbg !24, !tbaa !27
71 %y.0. = load volatile i32, ptr %y, align 4, !dbg !31, !tbaa !27
72 %add1 = add nsw i32 %y.0., 1, !dbg !32
73 call void @llvm.lifetime.end.p0(i64 4, ptr nonnull %y), !dbg !33
74 ret i32 %add1, !dbg !34
; Intrinsic declarations used by foo(): the debug-declare intrinsic for %y and
; the lifetime markers that bracket the %y stack slot.
77 ; Function Attrs: mustprogress nocallback nofree nosync nounwind readnone speculatable willreturn
78 declare void @llvm.dbg.declare(metadata, metadata, metadata) #1
80 ; Function Attrs: argmemonly mustprogress nocallback nofree nosync nounwind willreturn
81 declare void @llvm.lifetime.start.p0(i64 immarg, ptr nocapture) #2
83 ; Function Attrs: argmemonly mustprogress nocallback nofree nosync nounwind willreturn
84 declare void @llvm.lifetime.end.p0(i64 immarg, ptr nocapture) #2
86 ; Function Attrs: noinline nounwind uwtable
; bar(x): returns x + 2. Uses attribute group #3, which includes noinline.
; The llvm.pseudoprobe call (index 1) uses the same i64 identifier as the
; "bar" entry in !llvm.pseudo_probe_desc.
87 define dso_local i32 @bar(i32 noundef %x) #3 !dbg !35 {
89 call void @llvm.dbg.value(metadata i32 %x, metadata !37, metadata !DIExpression()), !dbg !38
90 call void @llvm.pseudoprobe(i64 -2012135647395072713, i64 1, i32 0, i64 -1), !dbg !39
91 %add = add nsw i32 %x, 2, !dbg !40
92 ret i32 %add, !dbg !41
95 ; Function Attrs: noinline nounwind uwtable
; matched(x): returns x + 3. Uses attribute group #3, which includes noinline.
; The llvm.pseudoprobe call (index 1) uses the same i64 identifier as the
; "matched" entry in !llvm.pseudo_probe_desc.
96 define dso_local i32 @matched(i32 noundef %x) #3 !dbg !42 {
98 call void @llvm.dbg.value(metadata i32 %x, metadata !44, metadata !DIExpression()), !dbg !45
99 call void @llvm.pseudoprobe(i64 -5844448289301669773, i64 1, i32 0, i64 -1), !dbg !46
100 %add = add nsw i32 %x, 3, !dbg !47
101 ret i32 %add, !dbg !48
104 ; Function Attrs: nounwind uwtable
; main(): two nested counted loops. The outer loop runs while %i.0 < 1000 and
; the inner loop while %a.0 < 10000 (both unsigned compares). Each inner
; iteration performs x = matched(x); x = foo(x); x = bar(x), where every read
; and write of @x is volatile.
; llvm.pseudoprobe calls with indices 1 through 11 appear across the blocks,
; all with the same i64 identifier as the "main" entry in
; !llvm.pseudo_probe_desc.
105 define dso_local i32 @main() #0 !dbg !49 {
107 call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 1, i32 0, i64 -1), !dbg !59
108 call void @llvm.dbg.value(metadata i32 0, metadata !53, metadata !DIExpression()), !dbg !60
109 br label %for.cond, !dbg !61
; Outer loop header: %i.0 is the outer induction variable.
111 for.cond: ; preds = %for.cond.cleanup3, %entry
112 %i.0 = phi i32 [ 0, %entry ], [ %inc8, %for.cond.cleanup3 ], !dbg !60
113 call void @llvm.dbg.value(metadata i32 %i.0, metadata !53, metadata !DIExpression()), !dbg !60
114 call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 2, i32 0, i64 -1), !dbg !62
115 %cmp = icmp ult i32 %i.0, 1000, !dbg !64
116 br i1 %cmp, label %for.body, label %for.cond.cleanup, !dbg !65
; Outer loop exit block.
118 for.cond.cleanup: ; preds = %for.cond
119 call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 3, i32 0, i64 -1), !dbg !67
120 call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 11, i32 0, i64 -1), !dbg !68
; Outer loop body: enters the inner loop.
123 for.body: ; preds = %for.cond
124 call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 4, i32 0, i64 -1), !dbg !69
125 call void @llvm.dbg.value(metadata i32 0, metadata !55, metadata !DIExpression()), !dbg !70
126 br label %for.cond1, !dbg !71
; Inner loop header: %a.0 is the inner induction variable.
128 for.cond1: ; preds = %for.body4, %for.body
129 %a.0 = phi i32 [ 0, %for.body ], [ %inc, %for.body4 ], !dbg !70
130 call void @llvm.dbg.value(metadata i32 %a.0, metadata !55, metadata !DIExpression()), !dbg !70
131 call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 5, i32 0, i64 -1), !dbg !72
132 %cmp2 = icmp ult i32 %a.0, 10000, !dbg !75
133 br i1 %cmp2, label %for.body4, label %for.cond.cleanup3, !dbg !76
; Inner loop exit / outer loop latch: increments %i.0 and branches back to
; the outer header with loop metadata !82.
135 for.cond.cleanup3: ; preds = %for.cond1
136 call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 6, i32 0, i64 -1), !dbg !67
137 call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 9, i32 0, i64 -1), !dbg !78
138 call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 10, i32 0, i64 -1), !dbg !79
139 %inc8 = add nuw nsw i32 %i.0, 1, !dbg !79
140 call void @llvm.dbg.value(metadata i32 %inc8, metadata !53, metadata !DIExpression()), !dbg !60
141 br label %for.cond, !dbg !81, !llvm.loop !82
; Inner loop body: the only three direct calls in this function. Their !dbg
; locations (!88, !92, !96) are scoped to DILexicalBlockFile nodes with
; non-zero discriminators.
; NOTE(review): presumably these are the three call sites counted by the
; callsite-mismatch CHECK lines -- confirm against the profile input.
143 for.body4: ; preds = %for.cond1
144 call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 7, i32 0, i64 -1), !dbg !86
145 %0 = load volatile i32, ptr @x, align 4, !dbg !86, !tbaa !27
146 %call = call i32 @matched(i32 noundef %0), !dbg !88
147 store volatile i32 %call, ptr @x, align 4, !dbg !90, !tbaa !27
148 %1 = load volatile i32, ptr @x, align 4, !dbg !91, !tbaa !27
149 %call5 = call i32 @foo(i32 noundef %1), !dbg !92
150 store volatile i32 %call5, ptr @x, align 4, !dbg !94, !tbaa !27
151 %2 = load volatile i32, ptr @x, align 4, !dbg !95, !tbaa !27
152 %call6 = call i32 @bar(i32 noundef %2), !dbg !96
153 store volatile i32 %call6, ptr @x, align 4, !dbg !98, !tbaa !27
154 call void @llvm.pseudoprobe(i64 -2624081020897602054, i64 8, i32 0, i64 -1), !dbg !99
155 %inc = add nuw nsw i32 %a.0, 1, !dbg !99
156 call void @llvm.dbg.value(metadata i32 %inc, metadata !55, metadata !DIExpression()), !dbg !70
157 br label %for.cond1, !dbg !101, !llvm.loop !102
; Intrinsic declarations used by every function in this module: the pseudo
; probe marker (i64, i64, i32, i64) and the debug-value intrinsic.
160 ; Function Attrs: inaccessiblememonly mustprogress nocallback nofree nosync nounwind willreturn
161 declare void @llvm.pseudoprobe(i64, i64, i32, i64) #4
163 ; Function Attrs: nocallback nofree nosync nounwind readnone speculatable willreturn
164 declare void @llvm.dbg.value(metadata, metadata, metadata) #5
; Attribute groups.
;   #0 - foo and main.
;   #3 - bar and matched; identical to #0 except for the added noinline.
;   Both #0 and #3 carry "use-sample-profile".
;   #1, #2, #4, #5 - the intrinsic declarations (dbg.declare, lifetime
;   markers, pseudoprobe, dbg.value respectively).
166 attributes #0 = { nounwind uwtable "frame-pointer"="none" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "use-sample-profile" }
167 attributes #1 = { mustprogress nocallback nofree nosync nounwind readnone speculatable willreturn }
168 attributes #2 = { argmemonly mustprogress nocallback nofree nosync nounwind willreturn }
169 attributes #3 = { noinline nounwind uwtable "frame-pointer"="none" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "use-sample-profile" }
170 attributes #4 = { inaccessiblememonly mustprogress nocallback nofree nosync nounwind willreturn }
171 attributes #5 = { nocallback nofree nosync nounwind readnone speculatable willreturn }
; Module-level named metadata. !llvm.pseudo_probe_desc lists one descriptor
; per defined function (foo, bar, matched, main).
174 !llvm.module.flags = !{!7, !8, !9, !10}
176 !llvm.pseudo_probe_desc = !{!12, !13, !14, !15}
; Debug info for the global @x and the compile unit for test.c.
178 !0 = !DIGlobalVariableExpression(var: !1, expr: !DIExpression())
179 !1 = distinct !DIGlobalVariable(name: "x", scope: !2, file: !3, line: 1, type: !5, isLocal: false, isDefinition: true)
180 !2 = distinct !DICompileUnit(language: DW_LANG_C99, file: !3, producer: "", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, globals: !4, splitDebugInlining: false, debugInfoForProfiling: true, nameTableKind: None)
181 !3 = !DIFile(filename: "test.c", directory: "")
183 !5 = !DIDerivedType(tag: DW_TAG_volatile_type, baseType: !6)
184 !6 = !DIBasicType(name: "int", size: 32, encoding: DW_ATE_signed)
; Module flag entries referenced by !llvm.module.flags.
185 !7 = !{i32 7, !"Dwarf Version", i32 5}
186 !8 = !{i32 2, !"Debug Info Version", i32 3}
187 !9 = !{i32 1, !"wchar_size", i32 4}
188 !10 = !{i32 7, !"uwtable", i32 2}
; Pseudo-probe descriptors. The first i64 equals the first argument of the
; llvm.pseudoprobe calls inside the named function. foo, bar and matched share
; the second value 4294967295; main has a different one.
; NOTE(review): the second i64 is presumably the function hash compared
; against the profile for the "function hash mismatch" report -- confirm.
190 !12 = !{i64 6699318081062747564, i64 4294967295, !"foo"}
191 !13 = !{i64 -2012135647395072713, i64 4294967295, !"bar"}
192 !14 = !{i64 -5844448289301669773, i64 4294967295, !"matched"}
193 !15 = !{i64 -2624081020897602054, i64 844635331715433, !"main"}
; Debug metadata for foo (source lines 2-5 of test.c): the subprogram, its
; parameter "x" and local "y", and the source locations used in its body.
194 !16 = distinct !DISubprogram(name: "foo", scope: !3, file: !3, line: 2, type: !17, scopeLine: 2, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !19)
195 !17 = !DISubroutineType(types: !18)
198 !20 = !DILocalVariable(name: "x", arg: 1, scope: !16, file: !3, line: 2, type: !6)
199 !21 = !DILocalVariable(name: "y", scope: !16, file: !3, line: 3, type: !5)
200 !22 = !DILocation(line: 0, scope: !16)
201 !23 = !DILocation(line: 3, column: 3, scope: !16)
202 !24 = !DILocation(line: 3, column: 16, scope: !16)
203 !25 = !DILocation(line: 3, column: 20, scope: !16)
204 !26 = !DILocation(line: 3, column: 22, scope: !16)
; TBAA nodes (!27-!30) attached via !tbaa to the volatile int loads and stores
; in foo and main.
205 !27 = !{!28, !28, i64 0}
206 !28 = !{!"int", !29, i64 0}
207 !29 = !{!"omnipotent char", !30, i64 0}
208 !30 = !{!"Simple C/C++ TBAA"}
209 !31 = !DILocation(line: 4, column: 10, scope: !16)
210 !32 = !DILocation(line: 4, column: 12, scope: !16)
211 !33 = !DILocation(line: 5, column: 1, scope: !16)
212 !34 = !DILocation(line: 4, column: 3, scope: !16)
; Debug metadata for bar (source lines 7-8 of test.c): the subprogram, its
; parameter "x", and the source locations used in its body.
213 !35 = distinct !DISubprogram(name: "bar", scope: !3, file: !3, line: 7, type: !17, scopeLine: 7, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !36)
215 !37 = !DILocalVariable(name: "x", arg: 1, scope: !35, file: !3, line: 7, type: !6)
216 !38 = !DILocation(line: 0, scope: !35)
217 !39 = !DILocation(line: 8, column: 10, scope: !35)
218 !40 = !DILocation(line: 8, column: 12, scope: !35)
219 !41 = !DILocation(line: 8, column: 3, scope: !35)
; Debug metadata for matched (source lines 11-12 of test.c), with the same
; layout as bar's.
220 !42 = distinct !DISubprogram(name: "matched", scope: !3, file: !3, line: 11, type: !17, scopeLine: 11, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !43)
222 !44 = !DILocalVariable(name: "x", arg: 1, scope: !42, file: !3, line: 11, type: !6)
223 !45 = !DILocation(line: 0, scope: !42)
224 !46 = !DILocation(line: 12, column: 10, scope: !42)
225 !47 = !DILocation(line: 12, column: 12, scope: !42)
226 !48 = !DILocation(line: 12, column: 3, scope: !42)
; Debug metadata for main (source lines 15-23 of test.c): the subprogram, the
; loop variables "i" and "a" with their lexical blocks, and the source
; locations used in its body.
227 !49 = distinct !DISubprogram(name: "main", scope: !3, file: !3, line: 15, type: !50, scopeLine: 15, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !52)
228 !50 = !DISubroutineType(types: !51)
231 !53 = !DILocalVariable(name: "i", scope: !54, file: !3, line: 16, type: !6)
232 !54 = distinct !DILexicalBlock(scope: !49, file: !3, line: 16, column: 3)
233 !55 = !DILocalVariable(name: "a", scope: !56, file: !3, line: 17, type: !6)
234 !56 = distinct !DILexicalBlock(scope: !57, file: !3, line: 17, column: 5)
235 !57 = distinct !DILexicalBlock(scope: !58, file: !3, line: 16, column: 34)
236 !58 = distinct !DILexicalBlock(scope: !54, file: !3, line: 16, column: 3)
237 !59 = !DILocation(line: 16, column: 12, scope: !54)
238 !60 = !DILocation(line: 0, scope: !54)
239 !61 = !DILocation(line: 16, column: 8, scope: !54)
240 !62 = !DILocation(line: 16, column: 19, scope: !63)
241 !63 = !DILexicalBlockFile(scope: !58, file: !3, discriminator: 0)
242 !64 = !DILocation(line: 16, column: 21, scope: !63)
243 !65 = !DILocation(line: 16, column: 3, scope: !66)
244 !66 = !DILexicalBlockFile(scope: !54, file: !3, discriminator: 0)
245 !67 = !DILocation(line: 0, scope: !49)
246 !68 = !DILocation(line: 23, column: 1, scope: !49)
247 !69 = !DILocation(line: 17, column: 14, scope: !56)
248 !70 = !DILocation(line: 0, scope: !56)
249 !71 = !DILocation(line: 17, column: 10, scope: !56)
250 !72 = !DILocation(line: 17, column: 21, scope: !73)
251 !73 = !DILexicalBlockFile(scope: !74, file: !3, discriminator: 0)
252 !74 = distinct !DILexicalBlock(scope: !56, file: !3, line: 17, column: 5)
253 !75 = !DILocation(line: 17, column: 23, scope: !73)
254 !76 = !DILocation(line: 17, column: 5, scope: !77)
255 !77 = !DILexicalBlockFile(scope: !56, file: !3, discriminator: 0)
256 !78 = !DILocation(line: 22, column: 3, scope: !57)
257 !79 = !DILocation(line: 16, column: 30, scope: !80)
258 !80 = !DILexicalBlockFile(scope: !58, file: !3, discriminator: 0)
259 !81 = !DILocation(line: 16, column: 3, scope: !80)
; Loop metadata for the outer loop, attached via !llvm.loop on the branch back
; to %for.cond. !85 is shared with the inner loop's metadata (!102).
260 !82 = distinct !{!82, !83, !84, !85}
261 !83 = !DILocation(line: 16, column: 3, scope: !54)
262 !84 = !DILocation(line: 22, column: 3, scope: !54)
263 !85 = !{!"llvm.loop.mustprogress"}
; Locations for the inner loop body (source lines 18-20). The three call
; locations !88, !92 and !96 use DILexicalBlockFile scopes (!89, !93, !97)
; with non-zero discriminators; every other DILexicalBlockFile here uses 0.
; NOTE(review): these discriminators presumably encode the call-site pseudo
; probe information -- confirm against the pseudo probe encoding.
264 !86 = !DILocation(line: 18, column: 19, scope: !87)
265 !87 = distinct !DILexicalBlock(scope: !74, file: !3, line: 17, column: 37)
266 !88 = !DILocation(line: 18, column: 11, scope: !89)
267 !89 = !DILexicalBlockFile(scope: !87, file: !3, discriminator: 186646631)
268 !90 = !DILocation(line: 18, column: 9, scope: !87)
269 !91 = !DILocation(line: 19, column: 15, scope: !87)
270 !92 = !DILocation(line: 19, column: 11, scope: !93)
271 !93 = !DILexicalBlockFile(scope: !87, file: !3, discriminator: 186646639)
272 !94 = !DILocation(line: 19, column: 9, scope: !87)
273 !95 = !DILocation(line: 20, column: 15, scope: !87)
274 !96 = !DILocation(line: 20, column: 11, scope: !97)
275 !97 = !DILexicalBlockFile(scope: !87, file: !3, discriminator: 186646647)
276 !98 = !DILocation(line: 20, column: 9, scope: !87)
277 !99 = !DILocation(line: 17, column: 33, scope: !100)
278 !100 = !DILexicalBlockFile(scope: !74, file: !3, discriminator: 0)
279 !101 = !DILocation(line: 17, column: 5, scope: !100)
; Loop metadata for the inner loop, attached via !llvm.loop on the branch back
; to %for.cond1.
280 !102 = distinct !{!102, !103, !104, !85}
281 !103 = !DILocation(line: 17, column: 5, scope: !56)
282 !104 = !DILocation(line: 21, column: 5, scope: !56)