1 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2 ; RUN: llc -mtriple=x86_64-unknown-unknown -mcpu=x86-64 -mattr=sse -enable-unsafe-fp-math < %s | FileCheck %s
4 ; The debug info in this test case was causing a crash because machine trace metrics
5 ; did not correctly ignore debug instructions. The check lines ensure that the
6 ; machine-combiner pass has run, reassociated the add operands, and therefore
7 ; used machine trace metrics.
9 define void @PR24199() { ; reproducer: llvm.dbg.value calls interleaved with a chain of fast-math float adds
10 ; CHECK-LABEL: PR24199:
11 ; CHECK: # %bb.0: # %entry
12 ; CHECK-NEXT: subq $24, %rsp
13 ; CHECK-NEXT: .cfi_def_cfa_offset 32
14 ; CHECK-NEXT: xorl %eax, %eax
15 ; CHECK-NEXT: testb %al, %al
16 ; CHECK-NEXT: je .LBB0_2
17 ; CHECK-NEXT: # %bb.1:
18 ; CHECK-NEXT: movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
19 ; CHECK-NEXT: jmp .LBB0_3
20 ; CHECK-NEXT: .LBB0_2: # %if.then
21 ; CHECK-NEXT: xorps %xmm0, %xmm0
22 ; CHECK-NEXT: .LBB0_3: # %if.end
23 ; CHECK-NEXT: movss %xmm0, {{[-0-9]+}}(%r{{[sb]}}p) # 4-byte Spill
24 ; CHECK-NEXT: callq foo
25 ; CHECK-NEXT: movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
26 ; CHECK-NEXT: movss {{[-0-9]+}}(%r{{[sb]}}p), %xmm2 # 4-byte Reload
27 ; CHECK-NEXT: # xmm2 = mem[0],zero,zero,zero
28 ; CHECK-NEXT: mulss %xmm0, %xmm2
29 ; CHECK-NEXT: movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
30 ; CHECK-NEXT: addss %xmm1, %xmm0
31 ; CHECK-NEXT: addss %xmm2, %xmm0
32 ; CHECK-NEXT: movss %xmm0, (%rax)
33 ; CHECK-NEXT: testl %eax, %eax
34 ; CHECK-NEXT: jne .LBB0_5
35 ; CHECK-NEXT: # %bb.4: # %if.end
36 ; CHECK-NEXT: xorps %xmm1, %xmm1
37 ; CHECK-NEXT: .LBB0_5: # %if.end
38 ; CHECK-NEXT: movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
39 ; CHECK-NEXT: addss %xmm0, %xmm0
40 ; CHECK-NEXT: addss %xmm1, %xmm0
41 ; CHECK-NEXT: callq bar
42 ; CHECK-NEXT: addq $24, %rsp
43 ; CHECK-NEXT: .cfi_def_cfa_offset 8
47 %i = alloca %struct.A, align 8 ; stack object; only referenced below through the bitcast that feeds lifetime.start
48 %tobool = icmp ne i32 undef, 0 ; compare on an undef operand; the i1 result is only consumed by the uitofp below
49 br i1 undef, label %if.end, label %if.then ; branch condition is undef
55 %h = phi float [ 0.0, %if.then ], [ 4.0, %entry ] ; %h = 0.0 when arriving from %if.then, 4.0 when arriving from %entry
56 call void @foo(%struct.A* nonnull undef) ; call with an undef pointer argument
57 tail call void @llvm.dbg.value(metadata %struct.A* undef, i64 0, metadata !5, metadata !4), !dbg !6 ; debug-only intrinsic call; the header comment attributes the original crash to such debug instructions
58 tail call void @llvm.dbg.value(metadata float %h, i64 0, metadata !5, metadata !4), !dbg !6 ; debug value describing %h
59 %n0 = load float, float* undef, align 4 ; float load through an undef pointer
60 %mul = fmul fast float %n0, %h ; %mul = %n0 * %h
61 %add = fadd fast float %mul, 1.0 ; %add = %mul + 1.0 (first add of the chain)
62 tail call void @llvm.dbg.value(metadata %struct.A* undef, i64 0, metadata !5, metadata !4), !dbg !6 ; debug-only intrinsic call placed between the two adds
63 tail call void @llvm.dbg.value(metadata float %add, i64 0, metadata !5, metadata !4), !dbg !6 ; debug value describing %add
64 %add.i = fadd fast float %add, %n0 ; %add.i = %add + %n0 (second add; the header comment says the add operands get reassociated)
65 store float %add.i, float* undef, align 4 ; store of the add-chain result through an undef pointer
66 %n1 = bitcast %struct.A* %i to i8* ; i8* view of %i for the lifetime intrinsic
67 call void @llvm.lifetime.start.p0i8(i64 16, i8* %n1) ; size operand is 16; NOTE(review): %struct.A is declared in this file as { float, float } - confirm the 16 is intentional
68 %n2 = load <2 x float>, <2 x float>* undef, align 8 ; vector load through an undef pointer
69 %conv = uitofp i1 %tobool to float ; unsigned conversion of the i1 compare result to float
70 %bitcast = extractelement <2 x float> %n2, i32 0 ; element 0 of %n2 (an extractelement, despite the value name)
71 %factor = fmul fast float %bitcast, 2.0 ; %factor = %bitcast * 2.0
72 %add3 = fadd fast float %factor, %conv ; %add3 = %factor + %conv
73 call void @bar(float %add3) ; passes the second fast-math result to @bar
77 %struct.A = type { float, float } ; two-float aggregate used for the alloca and as the pointee type of @foo's parameter
79 declare void @bar(float) ; external; called with %add3 in @PR24199
80 declare void @foo(%struct.A*) ; external; called with an undef pointer in @PR24199
81 declare void @llvm.lifetime.start.p0i8(i64, i8* nocapture) ; lifetime intrinsic taking a size and an i8* pointer
82 declare void @llvm.dbg.value(metadata, i64, metadata, metadata) ; debug-value intrinsic in the four-operand form used by this file
85 !llvm.module.flags = !{!2} ; module flags list; its only entry is !2
87 !0 = distinct !DICompileUnit(language: DW_LANG_C_plus_plus, file: !1, isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug) ; compile unit referenced by !3 through unit: !0
88 !1 = !DIFile(filename: "24199.cpp", directory: "/bin") ; file node shared by !0 and !3
89 !2 = !{i32 2, !"Debug Info Version", i32 3} ; "Debug Info Version" module flag with value 3
90 !3 = distinct !DISubprogram(linkageName: "foo", file: !1, line: 18, isLocal: false, isDefinition: true, scopeLine: 18, unit: !0) ; scope used by the variable !5 and the location !6
92 !5 = !DILocalVariable(name: "this", arg: 1, scope: !3, flags: DIFlagArtificial | DIFlagObjectPointer) ; the variable every llvm.dbg.value call in @PR24199 refers to
93 !6 = !DILocation(line: 0, scope: !3) ; line-0 location attached to the dbg.value calls via !dbg !6