test/CodeGen/PowerPC/2011-12-06-SpillAndRestoreCR.ll

   1 ; RUN: llc -verify-machineinstrs < %s -mtriple=powerpc-unknown-linux-gnu -mcpu=g4 | FileCheck %s
   2 ; RUN: llc -verify-machineinstrs < %s -mtriple=powerpc64-unknown-linux-gnu -mcpu=g4 | FileCheck %s
   3
   4 ; ModuleID = 'tsc.c'
   5 target datalayout = "E-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v128:128:128-n32:64"
     ; The layout string above describes a big-endian target ("E") with 64-bit
     ; pointers ("p:64:64:64"), matching the powerpc64 triple below.
     ; NOTE(review): the two llc invocations at the top of this file each pass
     ; -mtriple explicitly (one powerpc, one powerpc64); presumably that option
     ; takes precedence over the module-level triple -- confirm against the llc
     ; documentation.
   6 target triple = "powerpc64-unknown-linux-gnu"
   7
   8 @a = common global [32000 x float] zeroinitializer, align 16
     ; @a through @e are zero-initialized arrays of 32000 floats. @s3110 never
     ; loads from or stores to them; it only passes their addresses to @dummy.
   9 @b = common global [32000 x float] zeroinitializer, align 16
  10 @c = common global [32000 x float] zeroinitializer, align 16
  11 @d = common global [32000 x float] zeroinitializer, align 16
  12 @e = common global [32000 x float] zeroinitializer, align 16
     ; @aa, @bb and @cc are zero-initialized 256 x 256 float matrices. @aa is
     ; the only one @s3110 reads; @bb and @cc are only passed by address to
     ; @dummy.
  13 @aa = common global [256 x [256 x float]] zeroinitializer, align 16
  14 @bb = common global [256 x [256 x float]] zeroinitializer, align 16
  15 @cc = common global [256 x [256 x float]] zeroinitializer, align 16
     ; @temp receives the single float stored just before @s3110 returns.
  16 @temp = common global float 0.000000e+00, align 4
  17
     ; @.str81 is the string handed to @init; @.str235 is the format string
     ; handed to @printf.
  18 @.str81 = private unnamed_addr constant [6 x i8] c"s3110\00", align 1
  19 @.str235 = private unnamed_addr constant [15 x i8] c"S3110\09 %.2f \09\09\00", align 1
  20
  21 declare i32 @printf(i8* nocapture, ...) nounwind
     ; External routines called by @s3110; none of their bodies are in this
     ; file. In @s3110:
     ;   @printf - called once, after the loops, with the @.str235 format.
     ;   @init   - called once on entry with the @.str81 string.
     ;   @clock  - called before and after the loops; the difference is printed.
     ;   @dummy  - called at the end of every outermost-loop iteration.
     ;   @check  - called once, with -1, just before returning.
  22 declare i32 @init(i8* %name) nounwind
  23 declare i64 @clock() nounwind
  24 declare i32 @dummy(float*, float*, float*, float*, float*, [256 x float]*, [256 x float]*, [256 x float]*, float)
  25 declare void @check(i32 %name) nounwind
  26
  27 ; CHECK: mfcr
  28 ; CHECK: mtcr
  29
  30 define i32 @s3110() nounwind {
     ; Sole function defined in this test; the CHECK lines above expect llc's
     ; output to contain mfcr followed by mtcr.
     ;
     ; Structure, as written in the IR below:
     ;   - entry calls @init with the "s3110" string and samples @clock().
     ;   - for.body is the outermost loop, counted by %nl.041 until it reaches
     ;     78100.
     ;   - for.cond5.preheader / for.inc15 step the first index of @aa from 0
     ;     until it reaches 256.
     ;   - for.body7 steps the second index of @aa 16 elements at a time,
     ;     tracking the largest value seen (%max.*) and the position where it
     ;     was found (%xindex.* = first index, %yindex.* = second index).
     ;   - for.end17 passes the combined result to @dummy once per outermost
     ;     iteration.
     ;   - for.end23 prints the scaled clock difference, stores a float to
     ;     @temp, calls @check(-1) and returns 0.
     ;
     ; NOTE(review): presumably the 16 compare results per inner iteration,
     ; each feeding three selects, are what create the condition-register
     ; pressure this test depends on -- confirm before restructuring the IR.
  31 entry:
  32   %call = tail call i32 @init(i8* getelementptr inbounds ([6 x i8], [6 x i8]* @.str81, i64 0, i64 0))
  33   %call1 = tail call i64 @clock() nounwind
  34   br label %for.body
  35
  36 for.body:                                         ; preds = %for.end17, %entry
       ; Start of one outermost iteration: the running maximum is seeded with
       ; aa[0][0]; both index trackers restart at 0 in the preheader phis.
  37   %nl.041 = phi i32 [ 0, %entry ], [ %inc22, %for.end17 ]
  38   %0 = load float, float* getelementptr inbounds ([256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 0, i64 0), align 16
  39   br label %for.cond5.preheader
  40
  41 for.cond5.preheader:                              ; preds = %for.inc15, %for.body
       ; Carries the maximum and its indices from one first-index value to the
       ; next; %indvars.iv42 is the first index into @aa.
  42   %indvars.iv42 = phi i64 [ 0, %for.body ], [ %indvars.iv.next43, %for.inc15 ]
  43   %max.139 = phi float [ %0, %for.body ], [ %max.3.15, %for.inc15 ]
  44   %xindex.138 = phi i32 [ 0, %for.body ], [ %xindex.3.15, %for.inc15 ]
  45   %yindex.137 = phi i32 [ 0, %for.body ], [ %yindex.3.15, %for.inc15 ]
  46   br label %for.body7
  47
  48 for.body7:                                        ; preds = %for.body7, %for.cond5.preheader
       ; Innermost loop, 16 elements per trip. Each of the 16 groups below
       ; handles aa[%indvars.iv42][%indvars.iv + k] for k = 0..15: load the
       ; element, compare it (ogt) against the running maximum, then select
       ; the updated second index, first index and maximum.
       ;
       ; The element offsets are formed with "or" instead of "add".
       ; %indvars.iv starts at 0 and only ever advances by 16, so its low four
       ; bits are always clear and both operations give the same value for
       ; k < 16.
  49   %indvars.iv = phi i64 [ 0, %for.cond5.preheader ], [ %indvars.iv.next.15, %for.body7 ]
  50   %max.235 = phi float [ %max.139, %for.cond5.preheader ], [ %max.3.15, %for.body7 ]
  51   %xindex.234 = phi i32 [ %xindex.138, %for.cond5.preheader ], [ %xindex.3.15, %for.body7 ]
  52   %yindex.233 = phi i32 [ %yindex.137, %for.cond5.preheader ], [ %yindex.3.15, %for.body7 ]
       ; k = 0. %3 (the truncated first index) is reused by every group below.
  53   %arrayidx9 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv
  54   %1 = load float, float* %arrayidx9, align 16
  55   %cmp10 = fcmp ogt float %1, %max.235
  56   %2 = trunc i64 %indvars.iv to i32
  57   %yindex.3 = select i1 %cmp10, i32 %2, i32 %yindex.233
  58   %3 = trunc i64 %indvars.iv42 to i32
  59   %xindex.3 = select i1 %cmp10, i32 %3, i32 %xindex.234
  60   %max.3 = select i1 %cmp10, float %1, float %max.235
       ; k = 1
  61   %indvars.iv.next45 = or i64 %indvars.iv, 1
  62   %arrayidx9.1 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv.next45
  63   %4 = load float, float* %arrayidx9.1, align 4
  64   %cmp10.1 = fcmp ogt float %4, %max.3
  65   %5 = trunc i64 %indvars.iv.next45 to i32
  66   %yindex.3.1 = select i1 %cmp10.1, i32 %5, i32 %yindex.3
  67   %xindex.3.1 = select i1 %cmp10.1, i32 %3, i32 %xindex.3
  68   %max.3.1 = select i1 %cmp10.1, float %4, float %max.3
       ; k = 2
  69   %indvars.iv.next.146 = or i64 %indvars.iv, 2
  70   %arrayidx9.2 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv.next.146
  71   %6 = load float, float* %arrayidx9.2, align 8
  72   %cmp10.2 = fcmp ogt float %6, %max.3.1
  73   %7 = trunc i64 %indvars.iv.next.146 to i32
  74   %yindex.3.2 = select i1 %cmp10.2, i32 %7, i32 %yindex.3.1
  75   %xindex.3.2 = select i1 %cmp10.2, i32 %3, i32 %xindex.3.1
  76   %max.3.2 = select i1 %cmp10.2, float %6, float %max.3.1
       ; k = 3
  77   %indvars.iv.next.247 = or i64 %indvars.iv, 3
  78   %arrayidx9.3 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv.next.247
  79   %8 = load float, float* %arrayidx9.3, align 4
  80   %cmp10.3 = fcmp ogt float %8, %max.3.2
  81   %9 = trunc i64 %indvars.iv.next.247 to i32
  82   %yindex.3.3 = select i1 %cmp10.3, i32 %9, i32 %yindex.3.2
  83   %xindex.3.3 = select i1 %cmp10.3, i32 %3, i32 %xindex.3.2
  84   %max.3.3 = select i1 %cmp10.3, float %8, float %max.3.2
       ; k = 4
  85   %indvars.iv.next.348 = or i64 %indvars.iv, 4
  86   %arrayidx9.4 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv.next.348
  87   %10 = load float, float* %arrayidx9.4, align 16
  88   %cmp10.4 = fcmp ogt float %10, %max.3.3
  89   %11 = trunc i64 %indvars.iv.next.348 to i32
  90   %yindex.3.4 = select i1 %cmp10.4, i32 %11, i32 %yindex.3.3
  91   %xindex.3.4 = select i1 %cmp10.4, i32 %3, i32 %xindex.3.3
  92   %max.3.4 = select i1 %cmp10.4, float %10, float %max.3.3
       ; k = 5
  93   %indvars.iv.next.449 = or i64 %indvars.iv, 5
  94   %arrayidx9.5 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv.next.449
  95   %12 = load float, float* %arrayidx9.5, align 4
  96   %cmp10.5 = fcmp ogt float %12, %max.3.4
  97   %13 = trunc i64 %indvars.iv.next.449 to i32
  98   %yindex.3.5 = select i1 %cmp10.5, i32 %13, i32 %yindex.3.4
  99   %xindex.3.5 = select i1 %cmp10.5, i32 %3, i32 %xindex.3.4
 100   %max.3.5 = select i1 %cmp10.5, float %12, float %max.3.4
       ; k = 6
 101   %indvars.iv.next.550 = or i64 %indvars.iv, 6
 102   %arrayidx9.6 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv.next.550
 103   %14 = load float, float* %arrayidx9.6, align 8
 104   %cmp10.6 = fcmp ogt float %14, %max.3.5
 105   %15 = trunc i64 %indvars.iv.next.550 to i32
 106   %yindex.3.6 = select i1 %cmp10.6, i32 %15, i32 %yindex.3.5
 107   %xindex.3.6 = select i1 %cmp10.6, i32 %3, i32 %xindex.3.5
 108   %max.3.6 = select i1 %cmp10.6, float %14, float %max.3.5
       ; k = 7
 109   %indvars.iv.next.651 = or i64 %indvars.iv, 7
 110   %arrayidx9.7 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv.next.651
 111   %16 = load float, float* %arrayidx9.7, align 4
 112   %cmp10.7 = fcmp ogt float %16, %max.3.6
 113   %17 = trunc i64 %indvars.iv.next.651 to i32
 114   %yindex.3.7 = select i1 %cmp10.7, i32 %17, i32 %yindex.3.6
 115   %xindex.3.7 = select i1 %cmp10.7, i32 %3, i32 %xindex.3.6
 116   %max.3.7 = select i1 %cmp10.7, float %16, float %max.3.6
       ; k = 8
 117   %indvars.iv.next.752 = or i64 %indvars.iv, 8
 118   %arrayidx9.8 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv.next.752
 119   %18 = load float, float* %arrayidx9.8, align 16
 120   %cmp10.8 = fcmp ogt float %18, %max.3.7
 121   %19 = trunc i64 %indvars.iv.next.752 to i32
 122   %yindex.3.8 = select i1 %cmp10.8, i32 %19, i32 %yindex.3.7
 123   %xindex.3.8 = select i1 %cmp10.8, i32 %3, i32 %xindex.3.7
 124   %max.3.8 = select i1 %cmp10.8, float %18, float %max.3.7
       ; k = 9
 125   %indvars.iv.next.853 = or i64 %indvars.iv, 9
 126   %arrayidx9.9 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv.next.853
 127   %20 = load float, float* %arrayidx9.9, align 4
 128   %cmp10.9 = fcmp ogt float %20, %max.3.8
 129   %21 = trunc i64 %indvars.iv.next.853 to i32
 130   %yindex.3.9 = select i1 %cmp10.9, i32 %21, i32 %yindex.3.8
 131   %xindex.3.9 = select i1 %cmp10.9, i32 %3, i32 %xindex.3.8
 132   %max.3.9 = select i1 %cmp10.9, float %20, float %max.3.8
       ; k = 10
 133   %indvars.iv.next.954 = or i64 %indvars.iv, 10
 134   %arrayidx9.10 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv.next.954
 135   %22 = load float, float* %arrayidx9.10, align 8
 136   %cmp10.10 = fcmp ogt float %22, %max.3.9
 137   %23 = trunc i64 %indvars.iv.next.954 to i32
 138   %yindex.3.10 = select i1 %cmp10.10, i32 %23, i32 %yindex.3.9
 139   %xindex.3.10 = select i1 %cmp10.10, i32 %3, i32 %xindex.3.9
 140   %max.3.10 = select i1 %cmp10.10, float %22, float %max.3.9
       ; k = 11
 141   %indvars.iv.next.1055 = or i64 %indvars.iv, 11
 142   %arrayidx9.11 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv.next.1055
 143   %24 = load float, float* %arrayidx9.11, align 4
 144   %cmp10.11 = fcmp ogt float %24, %max.3.10
 145   %25 = trunc i64 %indvars.iv.next.1055 to i32
 146   %yindex.3.11 = select i1 %cmp10.11, i32 %25, i32 %yindex.3.10
 147   %xindex.3.11 = select i1 %cmp10.11, i32 %3, i32 %xindex.3.10
 148   %max.3.11 = select i1 %cmp10.11, float %24, float %max.3.10
       ; k = 12
 149   %indvars.iv.next.1156 = or i64 %indvars.iv, 12
 150   %arrayidx9.12 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv.next.1156
 151   %26 = load float, float* %arrayidx9.12, align 16
 152   %cmp10.12 = fcmp ogt float %26, %max.3.11
 153   %27 = trunc i64 %indvars.iv.next.1156 to i32
 154   %yindex.3.12 = select i1 %cmp10.12, i32 %27, i32 %yindex.3.11
 155   %xindex.3.12 = select i1 %cmp10.12, i32 %3, i32 %xindex.3.11
 156   %max.3.12 = select i1 %cmp10.12, float %26, float %max.3.11
       ; k = 13
 157   %indvars.iv.next.1257 = or i64 %indvars.iv, 13
 158   %arrayidx9.13 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv.next.1257
 159   %28 = load float, float* %arrayidx9.13, align 4
 160   %cmp10.13 = fcmp ogt float %28, %max.3.12
 161   %29 = trunc i64 %indvars.iv.next.1257 to i32
 162   %yindex.3.13 = select i1 %cmp10.13, i32 %29, i32 %yindex.3.12
 163   %xindex.3.13 = select i1 %cmp10.13, i32 %3, i32 %xindex.3.12
 164   %max.3.13 = select i1 %cmp10.13, float %28, float %max.3.12
       ; k = 14
 165   %indvars.iv.next.1358 = or i64 %indvars.iv, 14
 166   %arrayidx9.14 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv.next.1358
 167   %30 = load float, float* %arrayidx9.14, align 8
 168   %cmp10.14 = fcmp ogt float %30, %max.3.13
 169   %31 = trunc i64 %indvars.iv.next.1358 to i32
 170   %yindex.3.14 = select i1 %cmp10.14, i32 %31, i32 %yindex.3.13
 171   %xindex.3.14 = select i1 %cmp10.14, i32 %3, i32 %xindex.3.13
 172   %max.3.14 = select i1 %cmp10.14, float %30, float %max.3.13
       ; k = 15; the *.3.15 values feed the loop-carried phis.
 173   %indvars.iv.next.1459 = or i64 %indvars.iv, 15
 174   %arrayidx9.15 = getelementptr inbounds [256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 %indvars.iv42, i64 %indvars.iv.next.1459
 175   %32 = load float, float* %arrayidx9.15, align 4
 176   %cmp10.15 = fcmp ogt float %32, %max.3.14
 177   %33 = trunc i64 %indvars.iv.next.1459 to i32
 178   %yindex.3.15 = select i1 %cmp10.15, i32 %33, i32 %yindex.3.14
 179   %xindex.3.15 = select i1 %cmp10.15, i32 %3, i32 %xindex.3.14
 180   %max.3.15 = select i1 %cmp10.15, float %32, float %max.3.14
       ; Advance the second index by 16; leave the inner loop once the
       ; truncated counter equals 256.
 181   %indvars.iv.next.15 = add i64 %indvars.iv, 16
 182   %lftr.wideiv.15 = trunc i64 %indvars.iv.next.15 to i32
 183   %exitcond.15 = icmp eq i32 %lftr.wideiv.15, 256
 184   br i1 %exitcond.15, label %for.inc15, label %for.body7
 185
 186 for.inc15:                                        ; preds = %for.body7
       ; Advance the first index by 1; leave the middle loop once the
       ; truncated counter equals 256.
 187   %indvars.iv.next43 = add i64 %indvars.iv42, 1
 188   %lftr.wideiv = trunc i64 %indvars.iv.next43 to i32
 189   %exitcond = icmp eq i32 %lftr.wideiv, 256
 190   br i1 %exitcond, label %for.end17, label %for.cond5.preheader
 191
 192 for.end17:                                        ; preds = %for.inc15
       ; %add19 = maximum + float(first index) + float(second index). It is
       ; passed to @dummy together with the addresses of @a..@e, @aa, @bb and
       ; @cc. %add and %conv18 are reused in for.end23.
 193   %conv = sitofp i32 %xindex.3.15 to float
 194   %add = fadd float %max.3.15, %conv
 195   %conv18 = sitofp i32 %yindex.3.15 to float
 196   %add19 = fadd float %add, %conv18
 197   %call20 = tail call i32 @dummy(float* getelementptr inbounds ([32000 x float], [32000 x float]* @a, i64 0, i64 0), float* getelementptr inbounds ([32000 x float], [32000 x float]* @b, i64 0, i64 0), float* getelementptr inbounds ([32000 x float], [32000 x float]* @c, i64 0, i64 0), float* getelementptr inbounds ([32000 x float], [32000 x float]* @d, i64 0, i64 0), float* getelementptr inbounds ([32000 x float], [32000 x float]* @e, i64 0, i64 0), [256 x float]* getelementptr inbounds ([256 x [256 x float]], [256 x [256 x float]]* @aa, i64 0, i64 0), [256 x float]* getelementptr inbounds ([256 x [256 x float]], [256 x [256 x float]]* @bb, i64 0, i64 0), [256 x float]* getelementptr inbounds ([256 x [256 x float]], [256 x [256 x float]]* @cc, i64 0, i64 0), float %add19) nounwind
       ; Count the outermost iteration; stop after %inc22 reaches 78100.
 198   %inc22 = add nsw i32 %nl.041, 1
 199   %exitcond44 = icmp eq i32 %inc22, 78100
 200   br i1 %exitcond44, label %for.end23, label %for.body
 201
 202 for.end23:                                        ; preds = %for.end17
       ; Print (second clock sample - first clock sample) / 1e6 using the
       ; @.str235 format, then store %add + 1.0 + %conv18 + 1.0 (taken from
       ; the last outermost iteration) to @temp.
 203   %call24 = tail call i64 @clock() nounwind
 204   %sub = sub nsw i64 %call24, %call1
 205   %conv25 = sitofp i64 %sub to double
 206   %div = fdiv double %conv25, 1.000000e+06
 207   %call26 = tail call i32 (i8*, ...) @printf(i8* getelementptr inbounds ([15 x i8], [15 x i8]* @.str235, i64 0, i64 0), double %div) nounwind
 208   %add29 = fadd float %add, 1.000000e+00
 209   %add31 = fadd float %add29, %conv18
 210   %add32 = fadd float %add31, 1.000000e+00
 211   store float %add32, float* @temp, align 4
 212   tail call void @check(i32 -1)
 213   ret i32 0
 214 }
 215
 216 declare void @llvm.memcpy.p0i8.p0i8.i64(i8* nocapture, i8* nocapture, i64, i1) nounwind
     ; NOTE(review): neither @llvm.memcpy.p0i8.p0i8.i64 (above) nor @puts
     ; (below) is referenced by any instruction in the visible file; they look
     ; like leftovers from the program this test was reduced from.
 217
 218 declare i32 @puts(i8* nocapture) nounwind
 219
     ; NOTE(review): no instruction in the visible file attaches !3 (there is
     ; no !prof reference to it), so these branch weights appear to be unused.
 220 !3 = !{!"branch_weights", i32 64, i32 4}