1 ; RUN: llc -verify-machineinstrs -mcpu=pwr7 -disable-ppc-instr-form-prep < %s | FileCheck %s
2 ; RUN: llc -verify-machineinstrs -mcpu=pwr7 < %s | FileCheck %s -check-prefix=PIP
; The two llc invocations above compile this file for the pwr7 CPU twice:
; first with -disable-ppc-instr-form-prep (output matched against the default
; FileCheck prefix), then without that flag (output matched against the prefix
; named by -check-prefix). Both runs enable -verify-machineinstrs.
;
; Module target description: in the datalayout string "E" selects big-endian,
; "m:e" selects ELF name mangling, "i64:64" gives i64 a 64-bit ABI alignment
; and "n32:64" lists 32 and 64 bits as the native integer widths.
3 target datalayout = "E-m:e-i64:64-n32:64"
4 target triple = "powerpc64-unknown-linux-gnu"
6 ; Function Attrs: nounwind
; @foo takes no arguments and returns a double. It reserves two stack arrays
; of 2048 floats (%x and %y) and then runs a loop over indices 0..2047 that
; loads x[i] and y[i], widens both to double, multiplies them and adds the
; product to a running sum.
; No store to either array is visible in this IR, so the loaded values carry
; no meaning. NOTE(review): presumably only the addressing pattern of the two
; loads matters to the checks below - confirm.
7 define double @foo() #1 {
9 %x = alloca [2048 x float], align 4
10 %y = alloca [2048 x float], align 4
; Mark both 8192-byte (2048 * 4) arrays as live; the intrinsic takes an i8*,
; hence the bitcasts.
11 %0 = bitcast [2048 x float]* %x to i8*
12 call void @llvm.lifetime.start.p0i8(i64 8192, i8* %0) #2
13 %1 = bitcast [2048 x float]* %y to i8*
14 call void @llvm.lifetime.start.p0i8(i64 8192, i8* %1) #2
; Expected output of the first llc run (instruction-form preparation
; disabled): two addi instructions based on register 1 produce the two array
; base registers, an li materialises a zero index register, and both float
; loads use the indexed form lfsx with that shared index register. The two
; loads may appear in either order (DAG variants).
18 ; CHECK: addi [[REG1:[0-9]+]], 1,
19 ; CHECK: addi [[REG2:[0-9]+]], 1,
20 ; CHECK: li [[REG3:[0-9]+]], 0
22 ; CHECK-DAG: lfsx {{[0-9]+}}, [[REG1]], [[REG3]]
23 ; CHECK-DAG: lfsx {{[0-9]+}}, [[REG2]], [[REG3]]
; Expected output of the second llc run (pass enabled): the same two addi
; base computations, but the loads are in update form lfsu with a
; displacement of 4 bytes (one float) off each base register, again in
; either order.
27 ; PIP: addi [[REG1:[0-9]+]], 1,
28 ; PIP: addi [[REG2:[0-9]+]], 1,
30 ; PIP-DAG: lfsu {{[0-9]+}}, 4([[REG1]])
31 ; PIP-DAG: lfsu {{[0-9]+}}, 4([[REG2]])
; Loop body. Both phis are seeded from %entry (sum = 0.0, index = 0) and
; updated from the back edge.
34 for.body.i: ; preds = %entry, %for.body.i
35 %accumulator.09.i = phi double [ %add.i, %for.body.i ], [ 0.000000e+00, %entry ]
36 %i.08.i = phi i64 [ %inc.i, %for.body.i ], [ 0, %entry ]
; Load x[i] and extend it to double.
37 %arrayidx.i = getelementptr inbounds [2048 x float], [2048 x float]* %x, i64 0, i64 %i.08.i
38 %v14 = load float, float* %arrayidx.i, align 4
39 %conv.i = fpext float %v14 to double
; Load y[i] and extend it to double.
40 %arrayidx1.i = getelementptr inbounds [2048 x float], [2048 x float]* %y, i64 0, i64 %i.08.i
41 %v15 = load float, float* %arrayidx1.i, align 4
42 %conv2.i = fpext float %v15 to double
; sum += x[i] * y[i], computed in double precision.
43 %mul.i = fmul double %conv.i, %conv2.i
44 %add.i = fadd double %accumulator.09.i, %mul.i
45 %inc.i = add nuw nsw i64 %i.08.i, 1
; The exit test uses the pre-increment index, so the body runs for
; i = 0..2047 (2048 iterations) before leaving the loop.
46 %exitcond.i = icmp eq i64 %i.08.i, 2047
47 br i1 %exitcond.i, label %loop.exit, label %for.body.i
; The returned value is the phi %accumulator.09.i, not %add.i: it is the sum
; as it stood at the start of the final iteration, without that iteration's
; product.
49 loop.exit: ; preds = %for.body.i
50 ret double %accumulator.09.i
; External declarations. Only @llvm.lifetime.start.p0i8 is called from the
; visible body of @foo; @bar and @llvm.lifetime.end.p0i8 are declared but not
; referenced anywhere in this excerpt.
53 ; Function Attrs: nounwind
54 declare void @llvm.lifetime.start.p0i8(i64, i8* nocapture) #2
; Takes two float pointers and returns nothing; no call to it is visible here.
56 declare void @bar(float*, float*)
58 ; Function Attrs: nounwind
59 declare void @llvm.lifetime.end.p0i8(i64, i8* nocapture) #2
; Attribute groups. #1 is attached to @foo; #2 is attached to the lifetime
; intrinsic declarations and to their call sites; #0 is not referenced by
; anything visible in this excerpt.
61 attributes #0 = { nounwind readonly }
62 attributes #1 = { nounwind }
63 attributes #2 = { nounwind }