test/CodeGen/AMDGPU/debug-value2.ll

   1 ; RUN: llc -mtriple=amdgcn-amd-amdhsa -verify-machineinstrs < %s | FileCheck %s
   2
   3 %struct.ShapeData = type { <4 x float>, <4 x float>, <4 x float>, <4 x float>, <4 x float>, i32, i32, i64, <4 x float>, i32, i8, i8, i16, i32, i32 }
   4
   5 declare float @llvm.fmuladd.f32(float, float, float)
   6
   7 declare <4 x float> @llvm.fmuladd.v4f32(<4 x float>, <4 x float>, <4 x float>)
   8
   9 declare %struct.ShapeData addrspace(1)* @Scene_getSubShapeData(i32, i8 addrspace(1)*, i32 addrspace(1)*) local_unnamed_addr
  10
  11 define <4 x float> @Scene_transformT(i32 %subshapeIdx, <4 x float> %v, float %time, i8 addrspace(1)* %gScene, i32 addrspace(1)* %gSceneOffsets) local_unnamed_addr !dbg !110 {
  12 entry:
  13   ; CHECK: v_mov_b32_e32 v[[COPIED_ARG_PIECE:[0-9]+]], v9
  14
  15   ; CHECK: ;DEBUG_VALUE: Scene_transformT:gScene <- [DW_OP_constu 1, DW_OP_swap, DW_OP_xderef, DW_OP_LLVM_fragment 0 32] $vgpr6
  16   ; CHECK: ;DEBUG_VALUE: Scene_transformT:gScene <- [DW_OP_constu 1, DW_OP_swap, DW_OP_xderef, DW_OP_LLVM_fragment 32 32] $vgpr7
  17   call void @llvm.dbg.value(metadata i8 addrspace(1)* %gScene, metadata !120, metadata !DIExpression(DW_OP_constu, 1, DW_OP_swap, DW_OP_xderef)), !dbg !154
  18   ; CHECK: ;DEBUG_VALUE: Scene_transformT:gSceneOffsets <- [DW_OP_constu 1, DW_OP_swap, DW_OP_xderef, DW_OP_LLVM_fragment 0 32] $vgpr8
  19   ; CHECK: ;DEBUG_VALUE: Scene_transformT:gSceneOffsets <- [DW_OP_constu 1, DW_OP_swap, DW_OP_xderef, DW_OP_LLVM_fragment 32 32] $vgpr[[COPIED_ARG_PIECE]]
  20   call void @llvm.dbg.value(metadata i32 addrspace(1)* %gSceneOffsets, metadata !121, metadata !DIExpression(DW_OP_constu, 1, DW_OP_swap, DW_OP_xderef)), !dbg !155
  21   %call = tail call %struct.ShapeData addrspace(1)* @Scene_getSubShapeData(i32 %subshapeIdx, i8 addrspace(1)* %gScene, i32 addrspace(1)* %gSceneOffsets)
  22   %m_linearMotion = getelementptr inbounds %struct.ShapeData, %struct.ShapeData addrspace(1)* %call, i64 0, i32 2
  23   %tmp = load <4 x float>, <4 x float> addrspace(1)* %m_linearMotion, align 16
  24   %m_angularMotion = getelementptr inbounds %struct.ShapeData, %struct.ShapeData addrspace(1)* %call, i64 0, i32 3
  25   %tmp1 = load <4 x float>, <4 x float> addrspace(1)* %m_angularMotion, align 16
  26   %m_scaleMotion = getelementptr inbounds %struct.ShapeData, %struct.ShapeData addrspace(1)* %call, i64 0, i32 4
  27   %tmp2 = load <4 x float>, <4 x float> addrspace(1)* %m_scaleMotion, align 16
  28   %splat.splatinsert = insertelement <4 x float> undef, float %time, i32 0
  29   %splat.splat = shufflevector <4 x float> %splat.splatinsert, <4 x float> undef, <4 x i32> zeroinitializer
  30   %tmp3 = tail call <4 x float> @llvm.fmuladd.v4f32(<4 x float> %tmp2, <4 x float> %splat.splat, <4 x float> <float 1.000000e+00, float 1.000000e+00, float 1.000000e+00, float 1.000000e+00>)
  31   %m_translation = getelementptr inbounds %struct.ShapeData, %struct.ShapeData addrspace(1)* %call, i64 0, i32 0
  32   %tmp4 = load <4 x float>, <4 x float> addrspace(1)* %m_translation, align 16
  33   %m_quaternion = getelementptr inbounds %struct.ShapeData, %struct.ShapeData addrspace(1)* %call, i64 0, i32 1
  34   %tmp5 = load <4 x float>, <4 x float> addrspace(1)* %m_quaternion, align 16
  35   %m_scale = getelementptr inbounds %struct.ShapeData, %struct.ShapeData addrspace(1)* %call, i64 0, i32 8
  36   %tmp6 = load <4 x float>, <4 x float> addrspace(1)* %m_scale, align 16
  37   %mul = fmul <4 x float> %tmp6, %v
  38   %tmp7 = extractelement <4 x float> %tmp5, i64 0
  39   %sub.i.i = fsub float -0.000000e+00, %tmp7
  40   %vecinit.i.i = insertelement <4 x float> undef, float %sub.i.i, i32 0
  41   %tmp8 = extractelement <4 x float> %tmp5, i64 1
  42   %sub1.i.i = fsub float -0.000000e+00, %tmp8
  43   %vecinit2.i.i = insertelement <4 x float> %vecinit.i.i, float %sub1.i.i, i32 1
  44   %tmp9 = extractelement <4 x float> %tmp5, i64 2
  45   %sub3.i.i = fsub float -0.000000e+00, %tmp9
  46   %vecinit4.i.i = insertelement <4 x float> %vecinit2.i.i, float %sub3.i.i, i32 2
  47   %vecinit5.i.i = shufflevector <4 x float> %vecinit4.i.i, <4 x float> %tmp5, <4 x i32> <i32 0, i32 1, i32 2, i32 7>
  48   %tmp10 = insertelement <4 x float> %mul, float 0.000000e+00, i64 3
  49   %tmp11 = extractelement <4 x float> %mul, i64 2
  50   %tmp12 = extractelement <4 x float> %mul, i64 1
  51   %tmp13 = fmul float %tmp9, %tmp12
  52   %tmp14 = fsub float -0.000000e+00, %tmp13
  53   %tmp15 = tail call float @llvm.fmuladd.f32(float %tmp8, float %tmp11, float %tmp14)
  54   %tmp16 = extractelement <4 x float> %mul, i64 0
  55   %tmp17 = fmul float %tmp7, %tmp11
  56   %tmp18 = fsub float -0.000000e+00, %tmp17
  57   %tmp19 = tail call float @llvm.fmuladd.f32(float %tmp9, float %tmp16, float %tmp18)
  58   %tmp20 = fmul float %tmp8, %tmp16
  59   %tmp21 = fsub float -0.000000e+00, %tmp20
  60   %tmp22 = tail call float @llvm.fmuladd.f32(float %tmp7, float %tmp12, float %tmp21)
  61   %tmp23 = insertelement <4 x float> <float undef, float undef, float undef, float 0.000000e+00>, float %tmp15, i32 0
  62   %tmp24 = insertelement <4 x float> %tmp23, float %tmp19, i32 1
  63   %tmp25 = insertelement <4 x float> %tmp24, float %tmp22, i32 2
  64   %tmp26 = extractelement <4 x float> %tmp5, i64 3
  65   %splat.splat.i8.i = shufflevector <4 x float> %tmp5, <4 x float> undef, <4 x i32> <i32 3, i32 3, i32 3, i32 3>
  66   %splat.splat2.i9.i = shufflevector <4 x float> %tmp10, <4 x float> undef, <4 x i32> <i32 3, i32 3, i32 3, i32 3>
  67   %mul3.i10.i = fmul <4 x float> %tmp5, %splat.splat2.i9.i
  68   %tmp27 = tail call <4 x float> @llvm.fmuladd.v4f32(<4 x float> %splat.splat.i8.i, <4 x float> %tmp10, <4 x float> %mul3.i10.i)
  69   %add.i11.i = fadd <4 x float> %tmp27, %tmp25
  70   %tmp28 = extractelement <4 x float> %tmp5, i32 2
  71   %tmp29 = extractelement <4 x float> %mul, i32 2
  72   %tmp30 = extractelement <4 x float> %tmp5, i32 1
  73   %tmp31 = extractelement <4 x float> %mul, i32 1
  74   %tmp32 = extractelement <4 x float> %tmp5, i32 0
  75   %tmp33 = extractelement <4 x float> %mul, i32 0
  76   %tmp34 = fmul float %tmp32, %tmp33
  77   %tmp35 = tail call float @llvm.fmuladd.f32(float %tmp30, float %tmp31, float %tmp34)
  78   %tmp36 = tail call float @llvm.fmuladd.f32(float %tmp28, float %tmp29, float %tmp35)
  79   %tmp37 = tail call float @llvm.fmuladd.f32(float 0.000000e+00, float 0.000000e+00, float %tmp36)
  80   %neg.i12.i = fsub float -0.000000e+00, %tmp37
  81   %tmp38 = tail call float @llvm.fmuladd.f32(float %tmp26, float 0.000000e+00, float %neg.i12.i)
  82   %tmp39 = insertelement <4 x float> %add.i11.i, float %tmp38, i64 3
  83   %tmp40 = extractelement <4 x float> %add.i11.i, i64 1
  84   %tmp41 = extractelement <4 x float> %add.i11.i, i64 2
  85   %tmp42 = fmul float %tmp41, %sub1.i.i
  86   %tmp43 = fsub float -0.000000e+00, %tmp42
  87   %tmp44 = tail call float @llvm.fmuladd.f32(float %tmp40, float %sub3.i.i, float %tmp43)
  88   %tmp45 = extractelement <4 x float> %add.i11.i, i64 0
  89   %tmp46 = fmul float %tmp45, %sub3.i.i
  90   %tmp47 = fsub float -0.000000e+00, %tmp46
  91   %tmp48 = tail call float @llvm.fmuladd.f32(float %tmp41, float %sub.i.i, float %tmp47)
  92   %tmp49 = fmul float %tmp40, %sub.i.i
  93   %tmp50 = fsub float -0.000000e+00, %tmp49
  94   %tmp51 = tail call float @llvm.fmuladd.f32(float %tmp45, float %sub1.i.i, float %tmp50)
  95   %tmp52 = insertelement <4 x float> <float undef, float undef, float undef, float 0.000000e+00>, float %tmp44, i32 0
  96   %tmp53 = insertelement <4 x float> %tmp52, float %tmp48, i32 1
  97   %tmp54 = insertelement <4 x float> %tmp53, float %tmp51, i32 2
  98   %splat.splat.i.i = shufflevector <4 x float> %tmp39, <4 x float> undef, <4 x i32> <i32 3, i32 3, i32 3, i32 3>
  99   %tmp55 = extractelement <4 x float> %tmp5, i32 3
 100   %mul3.i.i = fmul <4 x float> %splat.splat.i8.i, %tmp39
 101   %tmp56 = tail call <4 x float> @llvm.fmuladd.v4f32(<4 x float> %splat.splat.i.i, <4 x float> %vecinit5.i.i, <4 x float> %mul3.i.i)
 102   %add.i.i = fadd <4 x float> %tmp56, %tmp54
 103   %tmp57 = extractelement <4 x float> %add.i11.i, i32 2
 104   %tmp58 = extractelement <4 x float> %add.i11.i, i32 1
 105   %tmp59 = extractelement <4 x float> %add.i11.i, i32 0
 106   %tmp60 = fmul float %tmp59, %sub.i.i
 107   %tmp61 = tail call float @llvm.fmuladd.f32(float %tmp58, float %sub1.i.i, float %tmp60)
 108   %tmp62 = tail call float @llvm.fmuladd.f32(float %tmp57, float %sub3.i.i, float %tmp61)
 109   %tmp63 = tail call float @llvm.fmuladd.f32(float 0.000000e+00, float 0.000000e+00, float %tmp62)
 110   %neg.i.i = fsub float -0.000000e+00, %tmp63
 111   %tmp64 = tail call float @llvm.fmuladd.f32(float %tmp38, float %tmp55, float %neg.i.i)
 112   %tmp65 = insertelement <4 x float> %add.i.i, float %tmp64, i64 3
 113   %mul2 = fmul <4 x float> %tmp3, %tmp65
 114   %tmp66 = extractelement <4 x float> %tmp1, i64 3
 115   %mul3 = fmul float %tmp66, %time
 116   %tmp67 = insertelement <4 x float> %tmp1, float 0.000000e+00, i32 3
 117   %tmp68 = shufflevector <4 x float> %tmp67, <4 x float> %tmp1, <4 x i32> <i32 0, i32 5, i32 undef, i32 3>
 118   %vecinit3.i.i = shufflevector <4 x float> %tmp68, <4 x float> %tmp1, <4 x i32> <i32 0, i32 1, i32 6, i32 3>
 119   %tmp69 = fcmp oeq <4 x float> %vecinit3.i.i, zeroinitializer
 120   %tmp70 = sext <4 x i1> %tmp69 to <4 x i32>
 121   %tmp71 = shufflevector <4 x i32> %tmp70, <4 x i32> undef, <2 x i32> <i32 2, i32 3>
 122   %tmp72 = shufflevector <4 x i32> %tmp70, <4 x i32> undef, <2 x i32> <i32 0, i32 1>
 123   %tmp73 = and <2 x i32> %tmp71, %tmp72
 124   %tmp74 = extractelement <2 x i32> %tmp73, i64 0
 125   %tmp75 = extractelement <2 x i32> %tmp73, i64 1
 126   %tmp76 = and i32 %tmp74, %tmp75
 127   %tmp77 = icmp sgt i32 %tmp76, -1
 128   br i1 %tmp77, label %bb, label %qtSet.exit
 129
 130 bb:                                               ; preds = %entry
 131   %tmp78 = extractelement <4 x float> %tmp1, i32 2
 132   %tmp79 = extractelement <4 x float> %tmp1, i32 1
 133   %tmp80 = extractelement <4 x float> %tmp1, i32 0
 134   %tmp81 = fmul float %tmp80, %tmp80
 135   %tmp82 = tail call float @llvm.fmuladd.f32(float %tmp79, float %tmp79, float %tmp81)
 136   %tmp83 = tail call float @llvm.fmuladd.f32(float %tmp78, float %tmp78, float %tmp82)
 137   %tmp84 = tail call float @llvm.fmuladd.f32(float 0.000000e+00, float 0.000000e+00, float %tmp83)
 138   %tmp85 = fcmp olt float %tmp84, 0x3810000000000000
 139   br i1 %tmp85, label %bb86, label %bb96
 140
 141 bb86:                                             ; preds = %bb
 142   %tmp87 = fmul <4 x float> %vecinit3.i.i, <float 0x4550000000000000, float 0x4550000000000000, float 0x4550000000000000, float 0x4550000000000000>
 143   %tmp88 = extractelement <4 x float> %tmp87, i64 3
 144   %tmp89 = extractelement <4 x float> %tmp87, i64 2
 145   %tmp90 = extractelement <4 x float> %tmp87, i64 1
 146   %tmp91 = extractelement <4 x float> %tmp87, i64 0
 147   %tmp92 = fmul float %tmp91, %tmp91
 148   %tmp93 = tail call float @llvm.fmuladd.f32(float %tmp90, float %tmp90, float %tmp92)
 149   %tmp94 = tail call float @llvm.fmuladd.f32(float %tmp89, float %tmp89, float %tmp93)
 150   %tmp95 = tail call float @llvm.fmuladd.f32(float %tmp88, float %tmp88, float %tmp94)
 151   br label %bb141
 152
 153 bb96:                                             ; preds = %bb
 154   %tmp97 = fcmp oeq float %tmp84, 0x7FF0000000000000
 155   br i1 %tmp97, label %bb98, label %bb141
 156
 157 bb98:                                             ; preds = %bb96
 158   %tmp99 = fmul <4 x float> %vecinit3.i.i, <float 0x3BD0000000000000, float 0x3BD0000000000000, float 0x3BD0000000000000, float 0x3BD0000000000000>
 159   %tmp100 = extractelement <4 x float> %tmp99, i64 3
 160   %tmp101 = extractelement <4 x float> %tmp99, i64 2
 161   %tmp102 = extractelement <4 x float> %tmp99, i64 1
 162   %tmp103 = extractelement <4 x float> %tmp99, i64 0
 163   %tmp104 = fmul float %tmp103, %tmp103
 164   %tmp105 = tail call float @llvm.fmuladd.f32(float %tmp102, float %tmp102, float %tmp104)
 165   %tmp106 = tail call float @llvm.fmuladd.f32(float %tmp101, float %tmp101, float %tmp105)
 166   %tmp107 = tail call float @llvm.fmuladd.f32(float %tmp100, float %tmp100, float %tmp106)
 167   %tmp108 = fcmp oeq float %tmp107, 0x7FF0000000000000
 168   br i1 %tmp108, label %bb109, label %bb141
 169
 170 bb109:                                            ; preds = %bb98
 171   %tmp110 = tail call zeroext i1 @llvm.amdgcn.class.f32(float %tmp103, i32 516)
 172   %tmp111 = sext i1 %tmp110 to i32
 173   %tmp112 = insertelement <4 x i32> undef, i32 %tmp111, i32 0
 174   %tmp113 = tail call zeroext i1 @llvm.amdgcn.class.f32(float %tmp102, i32 516)
 175   %tmp114 = sext i1 %tmp113 to i32
 176   %tmp115 = insertelement <4 x i32> %tmp112, i32 %tmp114, i32 1
 177   %tmp116 = tail call zeroext i1 @llvm.amdgcn.class.f32(float %tmp101, i32 516)
 178   %tmp117 = sext i1 %tmp116 to i32
 179   %tmp118 = insertelement <4 x i32> %tmp115, i32 %tmp117, i32 2
 180   %tmp119 = tail call zeroext i1 @llvm.amdgcn.class.f32(float %tmp100, i32 516)
 181   %tmp120 = sext i1 %tmp119 to i32
 182   %tmp121 = insertelement <4 x i32> %tmp118, i32 %tmp120, i32 3
 183   %tmp122 = ashr <4 x i32> %tmp121, <i32 31, i32 31, i32 31, i32 31>
 184   %tmp123 = and <4 x i32> %tmp122, <i32 1065353216, i32 1065353216, i32 1065353216, i32 1065353216>
 185   %tmp124 = bitcast <4 x i32> %tmp123 to <4 x float>
 186   %tmp125 = extractelement <4 x float> %tmp124, i64 0
 187   %tmp126 = tail call float @llvm.copysign.f32(float %tmp125, float %tmp103)
 188   %tmp127 = insertelement <4 x float> undef, float %tmp126, i32 0
 189   %tmp128 = extractelement <4 x float> %tmp124, i64 1
 190   %tmp129 = tail call float @llvm.copysign.f32(float %tmp128, float %tmp102)
 191   %tmp130 = insertelement <4 x float> %tmp127, float %tmp129, i32 1
 192   %tmp131 = extractelement <4 x float> %tmp124, i64 2
 193   %tmp132 = tail call float @llvm.copysign.f32(float %tmp131, float %tmp101)
 194   %tmp133 = insertelement <4 x float> %tmp130, float %tmp132, i32 2
 195   %tmp134 = extractelement <4 x float> %tmp124, i64 3
 196   %tmp135 = tail call float @llvm.copysign.f32(float %tmp134, float %tmp100)
 197   %tmp136 = insertelement <4 x float> %tmp133, float %tmp135, i32 3
 198   %tmp137 = fmul float %tmp126, %tmp126
 199   %tmp138 = tail call float @llvm.fmuladd.f32(float %tmp129, float %tmp129, float %tmp137)
 200   %tmp139 = tail call float @llvm.fmuladd.f32(float %tmp132, float %tmp132, float %tmp138)
 201   %tmp140 = tail call float @llvm.fmuladd.f32(float %tmp135, float %tmp135, float %tmp139)
 202   br label %bb141
 203
 204 bb141:                                            ; preds = %bb109, %bb98, %bb96, %bb86
 205   %tmp142 = phi <4 x float> [ %tmp87, %bb86 ], [ %tmp136, %bb109 ], [ %tmp99, %bb98 ], [ %vecinit3.i.i, %bb96 ]
 206   %tmp143 = phi float [ %tmp95, %bb86 ], [ %tmp140, %bb109 ], [ %tmp107, %bb98 ], [ %tmp84, %bb96 ]
 207   %tmp144 = tail call float @llvm.amdgcn.rsq.f32(float %tmp143)
 208   %tmp145 = insertelement <4 x float> undef, float %tmp144, i32 0
 209   %tmp146 = shufflevector <4 x float> %tmp145, <4 x float> undef, <4 x i32> zeroinitializer
 210   %tmp147 = fmul <4 x float> %tmp142, %tmp146
 211   br label %qtSet.exit
 212
 213 qtSet.exit:                                       ; preds = %bb141, %entry
 214   %tmp148 = phi <4 x float> [ %tmp147, %bb141 ], [ %vecinit3.i.i, %entry ]
 215   %div.i = fmul float %mul3, 5.000000e-01
 216   %cmp.i.i = fcmp olt float %div.i, 0x400921CAC0000000
 217   %cond.i.i = select i1 %cmp.i.i, float 0x401921CAC0000000, float 0.000000e+00
 218   %add.i18.i = fadd float %div.i, %cond.i.i
 219   %cmp1.i.i = fcmp ogt float %add.i18.i, 0x400921CAC0000000
 220   %cond2.i.i = select i1 %cmp1.i.i, float 0x401921CAC0000000, float 0.000000e+00
 221   %sub.i.i48 = fsub float %add.i18.i, %cond2.i.i
 222   %mul.i.i = fmul float %sub.i.i48, 0x3FF45F3060000000
 223   %cmp3.i.i = fcmp olt float %sub.i.i48, 0.000000e+00
 224   %mul5.i.i = select i1 %cmp3.i.i, float 0x3FD9F02F60000000, float 0xBFD9F02F60000000
 225   %mul6.i.i = fmul float %sub.i.i48, %mul5.i.i
 226   %tmp149 = tail call float @llvm.fmuladd.f32(float %mul6.i.i, float %sub.i.i48, float %mul.i.i)
 227   %cmp8.i.i = fcmp olt float %tmp149, 0.000000e+00
 228   %cond9.i.i = select i1 %cmp8.i.i, float -1.000000e+00, float 1.000000e+00
 229   %mul10.i.i = fmul float %tmp149, %cond9.i.i
 230   %neg.i.i49 = fsub float -0.000000e+00, %tmp149
 231   %tmp150 = tail call float @llvm.fmuladd.f32(float %mul10.i.i, float %tmp149, float %neg.i.i49)
 232   %tmp151 = tail call float @llvm.fmuladd.f32(float %tmp150, float 0x3FCCCCCCC0000000, float %tmp149)
 233   %tmp152 = extractelement <4 x float> %tmp148, i64 0
 234   %mul.i = fmul float %tmp151, %tmp152
 235   %tmp153 = insertelement <4 x float> undef, float %mul.i, i64 0
 236   %tmp154 = extractelement <4 x float> %tmp148, i64 1
 237   %mul2.i = fmul float %tmp151, %tmp154
 238   %tmp155 = insertelement <4 x float> %tmp153, float %mul2.i, i64 1
 239   %tmp156 = extractelement <4 x float> %tmp148, i64 2
 240   %mul3.i = fmul float %tmp151, %tmp156
 241   %tmp157 = insertelement <4 x float> %tmp155, float %mul3.i, i64 2
 242   %add.i.i50 = fadd float %div.i, 0x3FF921CAC0000000
 243   %cmp.i.i.i = fcmp olt float %add.i.i50, 0x400921CAC0000000
 244   %cond.i.i.i = select i1 %cmp.i.i.i, float 0x401921CAC0000000, float 0.000000e+00
 245   %add.i.i.i = fadd float %add.i.i50, %cond.i.i.i
 246   %cmp1.i.i.i = fcmp ogt float %add.i.i.i, 0x400921CAC0000000
 247   %cond2.i.i.i = select i1 %cmp1.i.i.i, float 0x401921CAC0000000, float 0.000000e+00
 248   %sub.i.i.i = fsub float %add.i.i.i, %cond2.i.i.i
 249   %mul.i.i.i = fmul float %sub.i.i.i, 0x3FF45F3060000000
 250   %cmp3.i.i.i = fcmp olt float %sub.i.i.i, 0.000000e+00
 251   %mul5.i.i.i = select i1 %cmp3.i.i.i, float 0x3FD9F02F60000000, float 0xBFD9F02F60000000
 252   %mul6.i.i.i = fmul float %sub.i.i.i, %mul5.i.i.i
 253   %tmp158 = tail call float @llvm.fmuladd.f32(float %mul6.i.i.i, float %sub.i.i.i, float %mul.i.i.i)
 254   %cmp8.i.i.i = fcmp olt float %tmp158, 0.000000e+00
 255   %cond9.i.i.i = select i1 %cmp8.i.i.i, float -1.000000e+00, float 1.000000e+00
 256   %mul10.i.i.i = fmul float %tmp158, %cond9.i.i.i
 257   %neg.i.i.i = fsub float -0.000000e+00, %tmp158
 258   %tmp159 = tail call float @llvm.fmuladd.f32(float %mul10.i.i.i, float %tmp158, float %neg.i.i.i)
 259   %tmp160 = tail call float @llvm.fmuladd.f32(float %tmp159, float 0x3FCCCCCCC0000000, float %tmp158)
 260   %tmp161 = insertelement <4 x float> %tmp157, float %tmp160, i64 3
 261   %sub.i.i32 = fsub float -0.000000e+00, %mul.i
 262   %vecinit.i.i33 = insertelement <4 x float> undef, float %sub.i.i32, i32 0
 263   %sub1.i.i34 = fsub float -0.000000e+00, %mul2.i
 264   %vecinit2.i.i35 = insertelement <4 x float> %vecinit.i.i33, float %sub1.i.i34, i32 1
 265   %sub3.i.i36 = fsub float -0.000000e+00, %mul3.i
 266   %vecinit4.i.i37 = insertelement <4 x float> %vecinit2.i.i35, float %sub3.i.i36, i32 2
 267   %vecinit5.i.i38 = shufflevector <4 x float> %vecinit4.i.i37, <4 x float> %tmp161, <4 x i32> <i32 0, i32 1, i32 2, i32 7>
 268   %tmp162 = insertelement <4 x float> %mul2, float 0.000000e+00, i64 3
 269   ret <4 x float> %tmp162
 270 }
 271
 272 declare float @llvm.copysign.f32(float, float)
 273
 274 declare i1 @llvm.amdgcn.class.f32(float, i32)
 275
 276 declare float @llvm.amdgcn.rsq.f32(float)
 277
 278 declare void @llvm.dbg.value(metadata, metadata, metadata)
 279
 280 !llvm.dbg.cu = !{!0}
 281 !llvm.module.flags = !{!104, !105, !106}
 282 !opencl.ocl.version = !{!107}
 283 !llvm.ident = !{!108, !109}
 284
 285 !0 = distinct !DICompileUnit(language: DW_LANG_C99, file: !1, producer: "clang version 7.0.0", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, enums: !2, retainedTypes: !74)
 286 !1 = !DIFile(filename: "tmp.cl", directory: "/home/yaxunl/h/git/llvm/assert")
 287 !2 = !{!3, !27, !37, !42, !46, !51, !55, !68}
 288 !3 = !DICompositeType(tag: DW_TAG_enumeration_type, name: "BrdfType", file: !4, line: 1334, size: 32, elements: !5)
 289 !4 = !DIFile(filename: "GraphMaterialSystemKernels1.cl", directory: "/home/yaxunl/h/git/llvm/assert")
 290 !5 = !{!6, !7, !8, !9, !10, !11, !12, !13, !14, !15, !16, !17, !18, !19, !20, !21, !22, !23, !24, !25, !26}
 291 !6 = !DIEnumerator(name: "BRDF_DEFAULT", value: 0)
 292 !7 = !DIEnumerator(name: "BRDF_LAMBERT", value: 1)
 293 !8 = !DIEnumerator(name: "BRDF_MICROFACET", value: 2)
 294 !9 = !DIEnumerator(name: "BRDF_REFLECT", value: 3)
 295 !10 = !DIEnumerator(name: "BRDF_REFRACT", value: 4)
 296 !11 = !DIEnumerator(name: "BRDF_EMISSIVE", value: 5)
 297 !12 = !DIEnumerator(name: "BRDF_LAYERED", value: 6)
 298 !13 = !DIEnumerator(name: "BRDF_FUR", value: 7)
 299 !14 = !DIEnumerator(name: "BRDF_DIFFUSE_ORENNAYAR", value: 8)
 300 !15 = !DIEnumerator(name: "BRDF_TRANSPARENT", value: 9)
 301 !16 = !DIEnumerator(name: "BRDF_PHONG", value: 10)
 302 !17 = !DIEnumerator(name: "BRDF_WARD", value: 11)
 303 !18 = !DIEnumerator(name: "BRDF_ASHIKHMIN", value: 12)
 304 !19 = !DIEnumerator(name: "BRDF_MICROFACET_GGX", value: 13)
 305 !20 = !DIEnumerator(name: "BRDF_MICROFACET_REFRACTION", value: 14)
 306 !21 = !DIEnumerator(name: "BRDF_PASSTHROUGH", value: 15)
 307 !22 = !DIEnumerator(name: "BRDF_VOLUME", value: 16)
 308 !23 = !DIEnumerator(name: "BRDF_LAMBERT_REFRACTION", value: 17)
 309 !24 = !DIEnumerator(name: "BRDF_MICROFACET_ANISOTROPIC_REFLECTION", value: 18)
 310 !25 = !DIEnumerator(name: "BRDF_MICROFACET_ANISOTROPIC_REFRACTION", value: 19)
 311 !26 = !DIEnumerator(name: "BRDF_MICROFACET_BECKMANN", value: 20)
 312 !27 = !DICompositeType(tag: DW_TAG_enumeration_type, name: "LightType", file: !4, line: 1470, size: 32, elements: !28)
 313 !28 = !{!29, !30, !31, !32, !33, !34, !35, !36}
 314 !29 = !DIEnumerator(name: "LIGHT_POINT", value: 0)
 315 !30 = !DIEnumerator(name: "LIGHT_SPOT", value: 1)
 316 !31 = !DIEnumerator(name: "LIGHT_DIRECTIONAL", value: 2)
 317 !32 = !DIEnumerator(name: "LIGHT_UNIFORM", value: 3)
 318 !33 = !DIEnumerator(name: "LIGHT_MESH", value: 4)
 319 !34 = !DIEnumerator(name: "LIGHT_IBL", value: 5)
 320 !35 = !DIEnumerator(name: "LIGHT_GONIOPHOTO", value: 6)
 321 !36 = !DIEnumerator(name: "LIGHT_SKY", value: 7)
 322 !37 = !DICompositeType(tag: DW_TAG_enumeration_type, file: !4, line: 1569, size: 32, elements: !38)
 323 !38 = !{!39, !40, !41}
 324 !39 = !DIEnumerator(name: "UG3D_FILTER_NEAREST", value: 0)
 325 !40 = !DIEnumerator(name: "UG3D_FILTER_LINEAR", value: 1)
 326 !41 = !DIEnumerator(name: "UG3D_FILTER_MONOTONIC_CUBIC", value: 2)
 327 !42 = !DICompositeType(tag: DW_TAG_enumeration_type, file: !4, line: 1562, size: 32, elements: !43)
 328 !43 = !{!44, !45}
 329 !44 = !DIEnumerator(name: "VH_CHECKER", value: 0)
 330 !45 = !DIEnumerator(name: "VH_OPENVDB", value: 1)
 331 !46 = !DICompositeType(tag: DW_TAG_enumeration_type, file: !4, line: 1554, size: 32, elements: !47)
 332 !47 = !{!48, !49, !50}
 333 !48 = !DIEnumerator(name: "VOLUME_HOMOGENEOUS", value: 0)
 334 !49 = !DIEnumerator(name: "VOLUME_HETEROGENEOUS", value: 1)
 335 !50 = !DIEnumerator(name: "VOLUME_NONE", value: 65535)
 336 !51 = !DICompositeType(tag: DW_TAG_enumeration_type, name: "VolumeFlags", file: !4, line: 1504, size: 32, elements: !52)
 337 !52 = !{!53, !54}
 338 !53 = !DIEnumerator(name: "VFLAGS_NONE", value: 0)
 339 !54 = !DIEnumerator(name: "VFLAGS_SINGLE_SCATTER", value: 1)
 340 !55 = !DICompositeType(tag: DW_TAG_enumeration_type, name: "OffsetIdx", file: !4, line: 1316, size: 32, elements: !56)
 341 !56 = !{!57, !58, !59, !60, !61, !62, !63, !64, !65, !66, !67}
 342 !57 = !DIEnumerator(name: "SCENE_OFFSET_IDX_FACE", value: 0)
 343 !58 = !DIEnumerator(name: "SCENE_OFFSET_IDX_VTX", value: 1)
 344 !59 = !DIEnumerator(name: "SCENE_OFFSET_IDX_N", value: 2)
 345 !60 = !DIEnumerator(name: "SCENE_OFFSET_IDX_TEXCRD", value: 3)
 346 !61 = !DIEnumerator(name: "SCENE_OFFSET_IDX_TEXCRD1", value: 4)
 347 !62 = !DIEnumerator(name: "SCENE_OFFSET_IDX_SUBSHAPE_DATA", value: 5)
 348 !63 = !DIEnumerator(name: "SCENE_OFFSET_IDX_MATERIAL", value: 6)
 349 !64 = !DIEnumerator(name: "SCENE_OFFSET_IDX_MATERIAL_DESC", value: 7)
 350 !65 = !DIEnumerator(name: "SCENE_OFFSET_IDX_GRID3D", value: 8)
 351 !66 = !DIEnumerator(name: "SCENE_OFFSET_IDX_WORLD_VOLUME", value: 9)
 352 !67 = !DIEnumerator(name: "SCENE_OFFSET_INTERVAL", value: 4)
 353 !68 = !DICompositeType(tag: DW_TAG_enumeration_type, file: !4, line: 1972, size: 32, elements: !69)
 354 !69 = !{!70, !71, !72, !73}
 355 !70 = !DIEnumerator(name: "FACE_TRIANGLE", value: 0)
 356 !71 = !DIEnumerator(name: "FACE_LINE_SEGMENT", value: 1)
 357 !72 = !DIEnumerator(name: "FACE_QUAD", value: 2)
 358 !73 = !DIEnumerator(name: "FACE_OTHERS", value: 3)
 359 !74 = !{!75, !77, !80, !83, !84, !87, !88, !102}
 360 !75 = !DIDerivedType(tag: DW_TAG_typedef, name: "u32", file: !4, line: 85, baseType: !76)
 361 !76 = !DIBasicType(name: "unsigned int", size: 32, encoding: DW_ATE_unsigned)
 362 !77 = !DIDerivedType(tag: DW_TAG_typedef, name: "float4", file: !78, line: 127, baseType: !79)
 363 !78 = !DIFile(filename: "/home/yaxunl/h/driver/1490442/opencl/include/opencl-c.h", directory: "/home/yaxunl/h/git/llvm/assert")
 364 !79 = !DICompositeType(tag: DW_TAG_array_type, baseType: !80, size: 128, flags: DIFlagVector, elements: !81)
 365 !80 = !DIBasicType(name: "float", size: 32, encoding: DW_ATE_float)
 366 !81 = !{!82}
 367 !82 = !DISubrange(count: 4)
 368 !83 = !DIBasicType(name: "int", size: 32, encoding: DW_ATE_signed)
 369 !84 = !DIDerivedType(tag: DW_TAG_pointer_type, baseType: !85, size: 32, dwarfAddressSpace: 1)
 370 !85 = !DIDerivedType(tag: DW_TAG_const_type, baseType: !86)
 371 !86 = !DIBasicType(name: "half", size: 16, encoding: DW_ATE_float)
 372 !87 = !DIDerivedType(tag: DW_TAG_pointer_type, baseType: !86, size: 32, dwarfAddressSpace: 1)
 373 !88 = !DIDerivedType(tag: DW_TAG_pointer_type, baseType: !89, size: 64)
 374 !89 = !DIDerivedType(tag: DW_TAG_typedef, name: "Face", file: !4, line: 1993, baseType: !90)
 375 !90 = distinct !DICompositeType(tag: DW_TAG_structure_type, file: !4, line: 1981, size: 640, elements: !91)
 376 !91 = !{!92, !94, !95, !96, !97, !98, !100, !101}
 377 !92 = !DIDerivedType(tag: DW_TAG_member, name: "m_v", scope: !90, file: !4, line: 1983, baseType: !93, size: 128)
 378 !93 = !DICompositeType(tag: DW_TAG_array_type, baseType: !83, size: 128, elements: !81)
 379 !94 = !DIDerivedType(tag: DW_TAG_member, name: "m_n", scope: !90, file: !4, line: 1984, baseType: !93, size: 128, offset: 128)
 380 !95 = !DIDerivedType(tag: DW_TAG_member, name: "m_t", scope: !90, file: !4, line: 1985, baseType: !93, size: 128, offset: 256)
 381 !96 = !DIDerivedType(tag: DW_TAG_member, name: "m_t1", scope: !90, file: !4, line: 1986, baseType: !93, size: 128, offset: 384)
 382 !97 = !DIDerivedType(tag: DW_TAG_member, name: "m_m", scope: !90, file: !4, line: 1988, baseType: !83, size: 32, offset: 512)
 383 !98 = !DIDerivedType(tag: DW_TAG_member, name: "m_type", scope: !90, file: !4, line: 1989, baseType: !99, size: 32, offset: 544)
 384 !99 = !DIDerivedType(tag: DW_TAG_typedef, name: "FaceType", file: !4, line: 1978, baseType: !68)
 385 !100 = !DIDerivedType(tag: DW_TAG_member, name: "m_lightIdx", scope: !90, file: !4, line: 1990, baseType: !83, size: 32, offset: 576)
 386 !101 = !DIDerivedType(tag: DW_TAG_member, name: "m_padding", scope: !90, file: !4, line: 1991, baseType: !83, size: 32, offset: 608)
 387 !102 = !DIDerivedType(tag: DW_TAG_typedef, name: "u64", file: !4, line: 84, baseType: !103)
 388 !103 = !DIBasicType(name: "long unsigned int", size: 64, encoding: DW_ATE_unsigned)
 389 !104 = !{i32 2, !"Dwarf Version", i32 2}
 390 !105 = !{i32 2, !"Debug Info Version", i32 3}
 391 !106 = !{i32 1, !"wchar_size", i32 4}
 392 !107 = !{i32 2, i32 0}
 393 !108 = !{!"clang version 7.0.0"}
 394 !109 = !{!"clang version 4.0 "}
 395 !110 = distinct !DISubprogram(name: "Scene_transformT", scope: !4, file: !4, line: 2182, type: !111, isLocal: false, isDefinition: true, scopeLine: 2183, flags: DIFlagPrototyped, isOptimized: true, unit: !0, retainedNodes: !116)
 396 !111 = !DISubroutineType(types: !112)
 397 !112 = !{!77, !83, !77, !80, !113, !115}
 398 !113 = !DIDerivedType(tag: DW_TAG_pointer_type, baseType: !114, size: 64)
 399 !114 = !DIBasicType(name: "char", size: 8, encoding: DW_ATE_signed_char)
 400 !115 = !DIDerivedType(tag: DW_TAG_pointer_type, baseType: !75, size: 64)
 401 !116 = !{!117, !118, !119, !120, !121, !122, !147, !149, !150, !151, !152, !153}
 402 !117 = !DILocalVariable(name: "subshapeIdx", arg: 1, scope: !110, file: !4, line: 2182, type: !83)
 403 !118 = !DILocalVariable(name: "v", arg: 2, scope: !110, file: !4, line: 2182, type: !77)
 404 !119 = !DILocalVariable(name: "time", arg: 3, scope: !110, file: !4, line: 2182, type: !80)
 405 !120 = !DILocalVariable(name: "gScene", arg: 4, scope: !110, file: !4, line: 2182, type: !113)
 406 !121 = !DILocalVariable(name: "gSceneOffsets", arg: 5, scope: !110, file: !4, line: 2182, type: !115)
 407 !122 = !DILocalVariable(name: "ss", scope: !110, file: !4, line: 2184, type: !123)
 408 !123 = !DIDerivedType(tag: DW_TAG_pointer_type, baseType: !124, size: 64)
 409 !124 = !DIDerivedType(tag: DW_TAG_typedef, name: "ShapeData", file: !4, line: 1949, baseType: !125)
 410 !125 = distinct !DICompositeType(tag: DW_TAG_structure_type, file: !4, line: 1927, size: 1024, elements: !126)
 411 !126 = !{!127, !128, !130, !131, !132, !133, !134, !135, !136, !137, !138, !141, !142, !145, !146}
 412 !127 = !DIDerivedType(tag: DW_TAG_member, name: "m_translation", scope: !125, file: !4, line: 1929, baseType: !77, size: 128)
 413 !128 = !DIDerivedType(tag: DW_TAG_member, name: "m_quaternion", scope: !125, file: !4, line: 1930, baseType: !129, size: 128, offset: 128)
 414 !129 = !DIDerivedType(tag: DW_TAG_typedef, name: "Quaternion", file: !4, line: 625, baseType: !77)
 415 !130 = !DIDerivedType(tag: DW_TAG_member, name: "m_linearMotion", scope: !125, file: !4, line: 1931, baseType: !77, size: 128, offset: 256)
 416 !131 = !DIDerivedType(tag: DW_TAG_member, name: "m_angularMotion", scope: !125, file: !4, line: 1932, baseType: !77, size: 128, offset: 384)
 417 !132 = !DIDerivedType(tag: DW_TAG_member, name: "m_scaleMotion", scope: !125, file: !4, line: 1933, baseType: !77, size: 128, offset: 512)
 418 !133 = !DIDerivedType(tag: DW_TAG_member, name: "m_rootIdx", scope: !125, file: !4, line: 1935, baseType: !75, size: 32, offset: 640)
 419 !134 = !DIDerivedType(tag: DW_TAG_member, name: "m_materialIdx", scope: !125, file: !4, line: 1936, baseType: !75, size: 32, offset: 672)
 420 !135 = !DIDerivedType(tag: DW_TAG_member, name: "m_shapeAddr", scope: !125, file: !4, line: 1937, baseType: !102, size: 64, offset: 704)
 421 !136 = !DIDerivedType(tag: DW_TAG_member, name: "m_scale", scope: !125, file: !4, line: 1939, baseType: !77, size: 128, offset: 768)
 422 !137 = !DIDerivedType(tag: DW_TAG_member, name: "m_flags", scope: !125, file: !4, line: 1941, baseType: !75, size: 32, offset: 896)
 423 !138 = !DIDerivedType(tag: DW_TAG_member, name: "m_hasUv", scope: !125, file: !4, line: 1942, baseType: !139, size: 8, offset: 928)
 424 !139 = !DIDerivedType(tag: DW_TAG_typedef, name: "u8", file: !4, line: 87, baseType: !140)
 425 !140 = !DIBasicType(name: "unsigned char", size: 8, encoding: DW_ATE_unsigned_char)
 426 !141 = !DIDerivedType(tag: DW_TAG_member, name: "m_padd00", scope: !125, file: !4, line: 1943, baseType: !139, size: 8, offset: 936)
 427 !142 = !DIDerivedType(tag: DW_TAG_member, name: "m_objectGroupId", scope: !125, file: !4, line: 1944, baseType: !143, size: 16, offset: 944)
 428 !143 = !DIDerivedType(tag: DW_TAG_typedef, name: "u16", file: !4, line: 86, baseType: !144)
 429 !144 = !DIBasicType(name: "unsigned short", size: 16, encoding: DW_ATE_unsigned)
 430 !145 = !DIDerivedType(tag: DW_TAG_member, name: "m_faceIndexShift", scope: !125, file: !4, line: 1946, baseType: !75, size: 32, offset: 960)
 431 !146 = !DIDerivedType(tag: DW_TAG_member, name: "m_padd2", scope: !125, file: !4, line: 1947, baseType: !75, size: 32, offset: 992)
 432 !147 = !DILocalVariable(name: "mt", scope: !148, file: !4, line: 2187, type: !77)
 433 !148 = distinct !DILexicalBlock(scope: !110, file: !4, line: 2186, column: 2)
 434 !149 = !DILocalVariable(name: "ma", scope: !148, file: !4, line: 2188, type: !77)
 435 !150 = !DILocalVariable(name: "ms", scope: !148, file: !4, line: 2189, type: !77)
 436 !151 = !DILocalVariable(name: "t", scope: !148, file: !4, line: 2191, type: !77)
 437 !152 = !DILocalVariable(name: "q", scope: !148, file: !4, line: 2193, type: !129)
 438 !153 = !DILocalVariable(name: "w", scope: !148, file: !4, line: 2194, type: !80)
 439 !154 = !DILocation(line: 2182, column: 80, scope: !110)
 440 !155 = !DILocation(line: 2182, column: 102, scope: !110)