; Test for sample-profile staleness reporting. The sample-profile pass is run
; with -report-profile-staleness and -persist-profile-staleness, and the
; callsite-mismatch statistics are verified in three places: the diagnostic
; text on stderr, the metadata in the emitted IR, and the .llvm_stats section
; that llc emits from that IR.
1 ; REQUIRES: x86_64-linux
; opt writes the transformed IR to %t.ll and redirects its stderr to %t.
2 ; RUN: opt < %s -passes=sample-profile -sample-profile-file=%S/Inputs/profile-mismatch.prof -report-profile-staleness -persist-profile-staleness -S 2>%t -o %t.ll
; The stderr capture is matched with the default prefix, the IR with the MD prefix.
3 ; RUN: FileCheck %s --input-file %t
4 ; RUN: FileCheck %s --input-file %t.ll -check-prefix=CHECK-MD
; The object file is only inspected for the presence of the section header;
; the section contents are verified on the textual assembly instead.
5 ; RUN: llc < %t.ll -filetype=obj -o %t.obj
6 ; RUN: llvm-objdump --section-headers %t.obj | FileCheck %s --check-prefix=CHECK-OBJ
7 ; RUN: llc < %t.ll -filetype=asm -o - | FileCheck %s --check-prefix=CHECK-ASM
; Expected statistics: 2 of 3 profiled callsites mismatched, 25 of 35 callsite samples discarded.
9 ; CHECK: (2/3) of callsites' profile are invalid and (25/35) of samples are discarded due to callsite location mismatch.
; The same four counters, as key/value pairs in a single metadata node.
11 ; CHECK-MD: ![[#]] = !{!"NumMismatchedCallsites", i64 2, !"TotalProfiledCallsites", i64 3, !"MismatchedCallsiteSamples", i64 25, !"TotalCallsiteSamples", i64 35}
13 ; CHECK-OBJ: .llvm_stats
; In the assembly each counter name is followed by its value as a string.
; The value strings are the base64 encodings of the decimal counts above:
; "Mg==" is "2", "Mw==" is "3", "MjU=" is "25", "MzU=" is "35".
15 ; CHECK-ASM: .section .llvm_stats,"",@progbits
17 ; CHECK-ASM: .ascii "NumMismatchedCallsites"
19 ; CHECK-ASM: .ascii "Mg=="
21 ; CHECK-ASM: .ascii "TotalProfiledCallsites"
23 ; CHECK-ASM: .ascii "Mw=="
25 ; CHECK-ASM: .ascii "MismatchedCallsiteSamples"
27 ; CHECK-ASM: .ascii "MjU="
29 ; CHECK-ASM: .ascii "TotalCallsiteSamples"
31 ; CHECK-ASM: .ascii "MzU="
33 target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
34 target triple = "x86_64-unknown-linux-gnu"
36 @x = dso_local global i32 0, align 4, !dbg !0
38 ; Function Attrs: nounwind uwtable
; foo(x): writes x + 1 to a volatile stack slot %y, reads it back, and returns
; the reloaded value plus 1. It uses attribute group #0, which, unlike #3,
; does not carry noinline.
39 define dso_local i32 @foo(i32 noundef %x) #0 !dbg !12 {
; Stack slot for the local variable described by !17.
41 %y = alloca i32, align 4
42 call void @llvm.dbg.value(metadata i32 %x, metadata !16, metadata !DIExpression()), !dbg !18
; The lifetime markers bracket the 4-byte slot between its first store and last load.
43 call void @llvm.lifetime.start.p0(i64 4, ptr nonnull %y), !dbg !19
44 call void @llvm.dbg.declare(metadata ptr %y, metadata !17, metadata !DIExpression()), !dbg !20
45 %add = add nsw i32 %x, 1, !dbg !21
; Volatile store followed by volatile load: the value goes through memory.
46 store volatile i32 %add, ptr %y, align 4, !dbg !20, !tbaa !22
47 %y.0. = load volatile i32, ptr %y, align 4, !dbg !26, !tbaa !22
48 %add1 = add nsw i32 %y.0., 1, !dbg !27
49 call void @llvm.lifetime.end.p0(i64 4, ptr nonnull %y), !dbg !28
50 ret i32 %add1, !dbg !29
; Intrinsics referenced from @foo: llvm.dbg.declare attaches the variable
; description !17 to the %y slot, and the two lifetime markers are called
; around the uses of that slot.
53 ; Function Attrs: mustprogress nocallback nofree nosync nounwind readnone speculatable willreturn
54 declare void @llvm.dbg.declare(metadata, metadata, metadata) #1
56 ; Function Attrs: argmemonly mustprogress nocallback nofree nosync nounwind willreturn
57 declare void @llvm.lifetime.start.p0(i64 immarg, ptr nocapture) #2
59 ; Function Attrs: argmemonly mustprogress nocallback nofree nosync nounwind willreturn
60 declare void @llvm.lifetime.end.p0(i64 immarg, ptr nocapture) #2
62 ; Function Attrs: noinline nounwind uwtable
; bar(x): returns x + 2. Marked noinline through attribute group #3.
63 define dso_local i32 @bar(i32 noundef %x) #3 !dbg !30 {
65 call void @llvm.dbg.value(metadata i32 %x, metadata !32, metadata !DIExpression()), !dbg !33
66 %add = add nsw i32 %x, 2, !dbg !34
67 ret i32 %add, !dbg !35
70 ; Function Attrs: noinline nounwind uwtable
; matched(x): returns x + 3. Marked noinline through attribute group #3.
; NOTE(review): the name suggests this is the callee whose callsite still
; agrees with the profile; confirm against Inputs/profile-mismatch.prof.
71 define dso_local i32 @matched(i32 noundef %x) #3 !dbg !36 {
73 call void @llvm.dbg.value(metadata i32 %x, metadata !38, metadata !DIExpression()), !dbg !39
74 %add = add nsw i32 %x, 3, !dbg !40
75 ret i32 %add, !dbg !41
78 ; Function Attrs: nounwind uwtable
; main(): two nested counting loops. The outer loop runs while i < 1000 and the
; inner loop while a < 10000 (both unsigned compares). Each inner iteration
; passes the volatile global @x through @matched, @foo and @bar in that order,
; storing each result back to @x. These three calls are the callsites in this
; function, located at source lines 18, 19 and 20 by their !dbg attachments.
79 define dso_local i32 @main() #0 !dbg !42 {
81 call void @llvm.dbg.value(metadata i32 0, metadata !46, metadata !DIExpression()), !dbg !52
82 br label %for.cond, !dbg !53
; Outer loop header: %i.0 is the outer induction variable.
84 for.cond: ; preds = %for.cond.cleanup3, %entry
85 %i.0 = phi i32 [ 0, %entry ], [ %inc8, %for.cond.cleanup3 ], !dbg !52
86 call void @llvm.dbg.value(metadata i32 %i.0, metadata !46, metadata !DIExpression()), !dbg !52
87 %cmp = icmp ult i32 %i.0, 1000, !dbg !54
88 br i1 %cmp, label %for.body, label %for.cond.cleanup, !dbg !56
; Outer loop exit: reached once %cmp is false.
90 for.cond.cleanup: ; preds = %for.cond
; Outer loop body: resets the inner counter and enters the inner loop.
93 for.body: ; preds = %for.cond
94 call void @llvm.dbg.value(metadata i32 0, metadata !48, metadata !DIExpression()), !dbg !59
95 br label %for.cond1, !dbg !60
; Inner loop header: %a.0 is the inner induction variable.
97 for.cond1: ; preds = %for.body4, %for.body
98 %a.0 = phi i32 [ 0, %for.body ], [ %inc, %for.body4 ], !dbg !59
99 call void @llvm.dbg.value(metadata i32 %a.0, metadata !48, metadata !DIExpression()), !dbg !59
100 %cmp2 = icmp ult i32 %a.0, 10000, !dbg !61
101 br i1 %cmp2, label %for.body4, label %for.cond.cleanup3, !dbg !64
; Inner loop exit doubles as the outer loop latch: increments i and loops back.
103 for.cond.cleanup3: ; preds = %for.cond1
104 %inc8 = add nuw nsw i32 %i.0, 1, !dbg !66
105 call void @llvm.dbg.value(metadata i32 %inc8, metadata !46, metadata !DIExpression()), !dbg !52
106 br label %for.cond, !dbg !68, !llvm.loop !69
; Inner loop body: three load/call/store rounds on @x, then the inner latch.
108 for.body4: ; preds = %for.cond1
; Callsite 1: @matched, debug location !75 (line 18, column 11).
109 %0 = load volatile i32, ptr @x, align 4, !dbg !73, !tbaa !22
110 %call = call i32 @matched(i32 noundef %0), !dbg !75
111 store volatile i32 %call, ptr @x, align 4, !dbg !76, !tbaa !22
; Callsite 2: @foo, debug location !78 (line 19, column 11).
112 %1 = load volatile i32, ptr @x, align 4, !dbg !77, !tbaa !22
113 %call5 = call i32 @foo(i32 noundef %1), !dbg !78
114 store volatile i32 %call5, ptr @x, align 4, !dbg !79, !tbaa !22
; Callsite 3: @bar, debug location !81 (line 20, column 11).
115 %2 = load volatile i32, ptr @x, align 4, !dbg !80, !tbaa !22
116 %call6 = call i32 @bar(i32 noundef %2), !dbg !81
117 store volatile i32 %call6, ptr @x, align 4, !dbg !82, !tbaa !22
118 %inc = add nuw nsw i32 %a.0, 1, !dbg !83
119 call void @llvm.dbg.value(metadata i32 %inc, metadata !48, metadata !DIExpression()), !dbg !59
120 br label %for.cond1, !dbg !85, !llvm.loop !86
; llvm.dbg.value is called by every function defined in this file to describe
; SSA values (arguments and loop counters) for the debugger.
123 ; Function Attrs: nocallback nofree nosync nounwind readnone speculatable willreturn
124 declare void @llvm.dbg.value(metadata, metadata, metadata) #4
; Attribute groups:
;   #0 - @foo and @main.
;   #1 - llvm.dbg.declare.
;   #2 - the lifetime start/end intrinsics.
;   #3 - @bar and @matched; identical to #0 except for the added noinline.
;   #4 - llvm.dbg.value.
; Both #0 and #3 carry "use-sample-profile".
126 attributes #0 = { nounwind uwtable "frame-pointer"="none" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "use-sample-profile" }
127 attributes #1 = { mustprogress nocallback nofree nosync nounwind readnone speculatable willreturn }
128 attributes #2 = { argmemonly mustprogress nocallback nofree nosync nounwind willreturn }
129 attributes #3 = { noinline nounwind uwtable "frame-pointer"="none" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+cx8,+fxsr,+mmx,+sse,+sse2,+x87" "tune-cpu"="generic" "use-sample-profile" }
130 attributes #4 = { nocallback nofree nosync nounwind readnone speculatable willreturn }
; Module-level metadata: the module flags (!7-!10), the debug description of
; the global @x (!0, !1, typed as volatile int through !5 and !6), the compile
; unit (!2) and its source file (!3). The compile unit sets
; debugInfoForProfiling: true.
133 !llvm.module.flags = !{!7, !8, !9, !10}
136 !0 = !DIGlobalVariableExpression(var: !1, expr: !DIExpression())
137 !1 = distinct !DIGlobalVariable(name: "x", scope: !2, file: !3, line: 1, type: !5, isLocal: false, isDefinition: true)
138 !2 = distinct !DICompileUnit(language: DW_LANG_C99, file: !3, producer: "clang", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, globals: !4, splitDebugInlining: false, debugInfoForProfiling: true, nameTableKind: None)
139 !3 = !DIFile(filename: "test.c", directory: "test")
141 !5 = !DIDerivedType(tag: DW_TAG_volatile_type, baseType: !6)
142 !6 = !DIBasicType(name: "int", size: 32, encoding: DW_ATE_signed)
143 !7 = !{i32 7, !"Dwarf Version", i32 5}
144 !8 = !{i32 2, !"Debug Info Version", i32 3}
145 !9 = !{i32 1, !"wchar_size", i32 4}
146 !10 = !{i32 7, !"uwtable", i32 2}
; Debug info for @foo: subprogram !12 (declared at source line 2), its
; parameter x (!16) and volatile local y (!17), and the source locations
; attached to its instructions (lines 3 to 5).
148 !12 = distinct !DISubprogram(name: "foo", scope: !3, file: !3, line: 2, type: !13, scopeLine: 2, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !15)
149 !13 = !DISubroutineType(types: !14)
152 !16 = !DILocalVariable(name: "x", arg: 1, scope: !12, file: !3, line: 2, type: !6)
153 !17 = !DILocalVariable(name: "y", scope: !12, file: !3, line: 3, type: !5)
154 !18 = !DILocation(line: 0, scope: !12)
155 !19 = !DILocation(line: 3, column: 3, scope: !12)
156 !20 = !DILocation(line: 3, column: 16, scope: !12)
157 !21 = !DILocation(line: 3, column: 22, scope: !12)
; TBAA access tag for "int" (!22), used by every volatile load and store in
; this file; the type chain ends at the "Simple C/C++ TBAA" root (!25).
158 !22 = !{!23, !23, i64 0}
159 !23 = !{!"int", !24, i64 0}
160 !24 = !{!"omnipotent char", !25, i64 0}
161 !25 = !{!"Simple C/C++ TBAA"}
162 !26 = !DILocation(line: 4, column: 10, scope: !12)
163 !27 = !DILocation(line: 4, column: 12, scope: !12)
164 !28 = !DILocation(line: 5, column: 1, scope: !12)
165 !29 = !DILocation(line: 4, column: 3, scope: !12)
; Debug info for @bar: subprogram !30 (declared at source line 7), its
; parameter x (!32), and the locations of its instructions on line 8.
166 !30 = distinct !DISubprogram(name: "bar", scope: !3, file: !3, line: 7, type: !13, scopeLine: 7, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !31)
168 !32 = !DILocalVariable(name: "x", arg: 1, scope: !30, file: !3, line: 7, type: !6)
169 !33 = !DILocation(line: 0, scope: !30)
170 !34 = !DILocation(line: 8, column: 12, scope: !30)
171 !35 = !DILocation(line: 8, column: 3, scope: !30)
; Debug info for @matched: subprogram !36 (declared at source line 11), its
; parameter x (!38), and the locations of its instructions on line 12.
172 !36 = distinct !DISubprogram(name: "matched", scope: !3, file: !3, line: 11, type: !13, scopeLine: 11, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !37)
174 !38 = !DILocalVariable(name: "x", arg: 1, scope: !36, file: !3, line: 11, type: !6)
175 !39 = !DILocation(line: 0, scope: !36)
176 !40 = !DILocation(line: 12, column: 12, scope: !36)
177 !41 = !DILocation(line: 12, column: 3, scope: !36)
; Debug info for @main: subprogram !42 (declared at source line 15), the loop
; counters i (!46) and a (!48) with their lexical-block scopes, and the source
; locations of the loop control instructions. The DILexicalBlockFile nodes
; carry discriminators 2 and 4.
178 !42 = distinct !DISubprogram(name: "main", scope: !3, file: !3, line: 15, type: !43, scopeLine: 15, flags: DIFlagPrototyped | DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition | DISPFlagOptimized, unit: !2, retainedNodes: !45)
179 !43 = !DISubroutineType(types: !44)
182 !46 = !DILocalVariable(name: "i", scope: !47, file: !3, line: 16, type: !6)
183 !47 = distinct !DILexicalBlock(scope: !42, file: !3, line: 16, column: 3)
184 !48 = !DILocalVariable(name: "a", scope: !49, file: !3, line: 17, type: !6)
185 !49 = distinct !DILexicalBlock(scope: !50, file: !3, line: 17, column: 5)
186 !50 = distinct !DILexicalBlock(scope: !51, file: !3, line: 16, column: 34)
187 !51 = distinct !DILexicalBlock(scope: !47, file: !3, line: 16, column: 3)
188 !52 = !DILocation(line: 0, scope: !47)
189 !53 = !DILocation(line: 16, column: 8, scope: !47)
190 !54 = !DILocation(line: 16, column: 21, scope: !55)
191 !55 = !DILexicalBlockFile(scope: !51, file: !3, discriminator: 2)
192 !56 = !DILocation(line: 16, column: 3, scope: !57)
193 !57 = !DILexicalBlockFile(scope: !47, file: !3, discriminator: 2)
194 !58 = !DILocation(line: 23, column: 1, scope: !42)
195 !59 = !DILocation(line: 0, scope: !49)
196 !60 = !DILocation(line: 17, column: 10, scope: !49)
197 !61 = !DILocation(line: 17, column: 23, scope: !62)
198 !62 = !DILexicalBlockFile(scope: !63, file: !3, discriminator: 2)
199 !63 = distinct !DILexicalBlock(scope: !49, file: !3, line: 17, column: 5)
200 !64 = !DILocation(line: 17, column: 5, scope: !65)
201 !65 = !DILexicalBlockFile(scope: !49, file: !3, discriminator: 2)
202 !66 = !DILocation(line: 16, column: 30, scope: !67)
203 !67 = !DILexicalBlockFile(scope: !51, file: !3, discriminator: 4)
204 !68 = !DILocation(line: 16, column: 3, scope: !67)
; Loop metadata for the outer loop (attached to its back edge): source range
; lines 16 to 22, plus the mustprogress property shared with the inner loop.
205 !69 = distinct !{!69, !70, !71, !72}
206 !70 = !DILocation(line: 16, column: 3, scope: !47)
207 !71 = !DILocation(line: 22, column: 3, scope: !47)
208 !72 = !{!"llvm.loop.mustprogress"}
; Locations inside the inner loop body (scope !74). The three call
; instructions use !75 (line 18), !78 (line 19) and !81 (line 20), all at
; column 11; the neighbouring entries belong to the loads and stores of @x.
209 !73 = !DILocation(line: 18, column: 19, scope: !74)
210 !74 = distinct !DILexicalBlock(scope: !63, file: !3, line: 17, column: 37)
211 !75 = !DILocation(line: 18, column: 11, scope: !74)
212 !76 = !DILocation(line: 18, column: 9, scope: !74)
213 !77 = !DILocation(line: 19, column: 15, scope: !74)
214 !78 = !DILocation(line: 19, column: 11, scope: !74)
215 !79 = !DILocation(line: 19, column: 9, scope: !74)
216 !80 = !DILocation(line: 20, column: 15, scope: !74)
217 !81 = !DILocation(line: 20, column: 11, scope: !74)
218 !82 = !DILocation(line: 20, column: 9, scope: !74)
219 !83 = !DILocation(line: 17, column: 33, scope: !84)
220 !84 = !DILexicalBlockFile(scope: !63, file: !3, discriminator: 4)
221 !85 = !DILocation(line: 17, column: 5, scope: !84)
; Loop metadata for the inner loop: source range lines 17 to 21.
222 !86 = distinct !{!86, !87, !88, !72}
223 !87 = !DILocation(line: 17, column: 5, scope: !49)
224 !88 = !DILocation(line: 21, column: 5, scope: !49)