1 ; RUN: llc -O3 -march=hexagon < %s
4 target triple = "hexagon-unknown--elf"
6 @g0 = external global ptr
8 ; Function Attrs: nounwind
9 define void @f0(ptr nocapture %a0, ptr nocapture %a1, ptr %a2) #0 {
11 %v0 = alloca [64 x float], align 16
12 %v1 = alloca [8 x float], align 8
13 call void @llvm.lifetime.start.p0(i64 256, ptr %v0) #2
14 %v3 = load float, ptr %a0, align 4, !tbaa !0
15 %v4 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 35
16 store float %v3, ptr %v4, align 4, !tbaa !0
17 store float %v3, ptr %v0, align 16, !tbaa !0
18 %v6 = getelementptr inbounds float, ptr %a0, i32 1
19 %v7 = load float, ptr %v6, align 4, !tbaa !0
20 %v8 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 36
21 store float %v7, ptr %v8, align 16, !tbaa !0
22 %v9 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 1
23 store float %v7, ptr %v9, align 4, !tbaa !0
24 %v10 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 37
25 store float 1.000000e+00, ptr %v10, align 4, !tbaa !0
26 %v11 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 2
27 store float 1.000000e+00, ptr %v11, align 8, !tbaa !0
28 %v12 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 34
29 store float 0.000000e+00, ptr %v12, align 8, !tbaa !0
30 %v13 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 33
31 store float 0.000000e+00, ptr %v13, align 4, !tbaa !0
32 %v14 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 32
33 store float 0.000000e+00, ptr %v14, align 16, !tbaa !0
34 %v15 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 5
35 store float 0.000000e+00, ptr %v15, align 4, !tbaa !0
36 %v16 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 4
37 store float 0.000000e+00, ptr %v16, align 16, !tbaa !0
38 %v17 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 3
39 store float 0.000000e+00, ptr %v17, align 4, !tbaa !0
40 %v18 = load float, ptr %a1, align 4, !tbaa !0
41 %v19 = fmul float %v3, %v18
42 %v20 = fsub float -0.000000e+00, %v19
43 %v21 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 6
44 store float %v20, ptr %v21, align 8, !tbaa !0
45 %v22 = fmul float %v7, %v18
46 %v23 = fsub float -0.000000e+00, %v22
47 %v24 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 7
48 store float %v23, ptr %v24, align 4, !tbaa !0
49 %v25 = getelementptr inbounds float, ptr %a1, i32 1
50 %v26 = load float, ptr %v25, align 4, !tbaa !0
51 %v27 = fmul float %v3, %v26
52 %v28 = fsub float -0.000000e+00, %v27
53 %v29 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 38
54 store float %v28, ptr %v29, align 8, !tbaa !0
55 %v30 = fmul float %v7, %v26
56 %v31 = fsub float -0.000000e+00, %v30
57 %v32 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 39
58 store float %v31, ptr %v32, align 4, !tbaa !0
59 store float %v18, ptr %v1, align 8, !tbaa !0
60 %v34 = getelementptr inbounds [8 x float], ptr %v1, i32 0, i32 4
61 store float %v26, ptr %v34, align 8, !tbaa !0
62 %v35 = getelementptr float, ptr %a0, i32 2
63 %v36 = getelementptr float, ptr %a1, i32 2
64 %v37 = load float, ptr %v35, align 4, !tbaa !0
65 %v38 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 43
66 store float %v37, ptr %v38, align 4, !tbaa !0
67 %v39 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 8
68 store float %v37, ptr %v39, align 16, !tbaa !0
69 %v40 = getelementptr inbounds float, ptr %a0, i32 3
70 %v41 = load float, ptr %v40, align 4, !tbaa !0
71 %v42 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 44
72 store float %v41, ptr %v42, align 16, !tbaa !0
73 %v43 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 9
74 store float %v41, ptr %v43, align 4, !tbaa !0
75 %v44 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 45
76 store float 1.000000e+00, ptr %v44, align 4, !tbaa !0
77 %v45 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 10
78 store float 1.000000e+00, ptr %v45, align 8, !tbaa !0
79 %v46 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 42
80 store float 0.000000e+00, ptr %v46, align 8, !tbaa !0
81 %v47 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 41
82 store float 0.000000e+00, ptr %v47, align 4, !tbaa !0
83 %v48 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 40
84 store float 0.000000e+00, ptr %v48, align 16, !tbaa !0
85 %v49 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 13
86 store float 0.000000e+00, ptr %v49, align 4, !tbaa !0
87 %v50 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 12
88 store float 0.000000e+00, ptr %v50, align 16, !tbaa !0
89 %v51 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 11
90 store float 0.000000e+00, ptr %v51, align 4, !tbaa !0
91 %v52 = load float, ptr %v36, align 4, !tbaa !0
92 %v53 = fmul float %v37, %v52
93 %v54 = fsub float -0.000000e+00, %v53
94 %v55 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 14
95 store float %v54, ptr %v55, align 8, !tbaa !0
96 %v56 = fmul float %v41, %v52
97 %v57 = fsub float -0.000000e+00, %v56
98 %v58 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 15
99 store float %v57, ptr %v58, align 4, !tbaa !0
100 %v59 = getelementptr inbounds float, ptr %a1, i32 3
101 %v60 = load float, ptr %v59, align 4, !tbaa !0
102 %v61 = fmul float %v37, %v60
103 %v62 = fsub float -0.000000e+00, %v61
104 %v63 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 46
105 store float %v62, ptr %v63, align 8, !tbaa !0
106 %v64 = fmul float %v41, %v60
107 %v65 = fsub float -0.000000e+00, %v64
108 %v66 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 47
109 store float %v65, ptr %v66, align 4, !tbaa !0
110 %v67 = getelementptr inbounds [8 x float], ptr %v1, i32 0, i32 1
111 store float %v52, ptr %v67, align 4, !tbaa !0
112 %v68 = getelementptr inbounds [8 x float], ptr %v1, i32 0, i32 5
113 store float %v60, ptr %v68, align 4, !tbaa !0
114 %v69 = getelementptr float, ptr %a0, i32 4
115 %v70 = getelementptr float, ptr %a1, i32 4
116 %v71 = load float, ptr %v69, align 4, !tbaa !0
117 %v72 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 51
118 store float %v71, ptr %v72, align 4, !tbaa !0
119 %v73 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 16
120 store float %v71, ptr %v73, align 16, !tbaa !0
121 %v74 = getelementptr inbounds float, ptr %a0, i32 5
122 %v75 = load float, ptr %v74, align 4, !tbaa !0
123 %v76 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 52
124 store float %v75, ptr %v76, align 16, !tbaa !0
125 %v77 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 17
126 store float %v75, ptr %v77, align 4, !tbaa !0
127 %v78 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 53
128 store float 1.000000e+00, ptr %v78, align 4, !tbaa !0
129 %v79 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 18
130 store float 1.000000e+00, ptr %v79, align 8, !tbaa !0
131 %v80 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 50
132 store float 0.000000e+00, ptr %v80, align 8, !tbaa !0
133 %v81 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 49
134 store float 0.000000e+00, ptr %v81, align 4, !tbaa !0
135 %v82 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 48
136 store float 0.000000e+00, ptr %v82, align 16, !tbaa !0
137 %v83 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 21
138 store float 0.000000e+00, ptr %v83, align 4, !tbaa !0
139 %v84 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 20
140 store float 0.000000e+00, ptr %v84, align 16, !tbaa !0
141 %v85 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 19
142 store float 0.000000e+00, ptr %v85, align 4, !tbaa !0
143 %v86 = load float, ptr %v70, align 4, !tbaa !0
144 %v87 = fmul float %v71, %v86
145 %v88 = fsub float -0.000000e+00, %v87
146 %v89 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 22
147 store float %v88, ptr %v89, align 8, !tbaa !0
148 %v90 = fmul float %v75, %v86
149 %v91 = fsub float -0.000000e+00, %v90
150 %v92 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 23
151 store float %v91, ptr %v92, align 4, !tbaa !0
152 %v93 = getelementptr inbounds float, ptr %a1, i32 5
153 %v94 = load float, ptr %v93, align 4, !tbaa !0
154 %v95 = fmul float %v71, %v94
155 %v96 = fsub float -0.000000e+00, %v95
156 %v97 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 54
157 store float %v96, ptr %v97, align 8, !tbaa !0
158 %v98 = fmul float %v75, %v94
159 %v99 = fsub float -0.000000e+00, %v98
160 %v100 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 55
161 store float %v99, ptr %v100, align 4, !tbaa !0
162 %v101 = getelementptr inbounds [8 x float], ptr %v1, i32 0, i32 2
163 store float %v86, ptr %v101, align 8, !tbaa !0
164 %v102 = getelementptr inbounds [8 x float], ptr %v1, i32 0, i32 6
165 store float %v94, ptr %v102, align 8, !tbaa !0
166 %v103 = getelementptr float, ptr %a0, i32 6
167 %v104 = getelementptr float, ptr %a1, i32 6
168 %v105 = load float, ptr %v103, align 4, !tbaa !0
169 %v106 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 59
170 store float %v105, ptr %v106, align 4, !tbaa !0
171 %v107 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 24
172 store float %v105, ptr %v107, align 16, !tbaa !0
173 %v108 = getelementptr inbounds float, ptr %a0, i32 7
174 %v109 = load float, ptr %v108, align 4, !tbaa !0
175 %v110 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 60
176 store float %v109, ptr %v110, align 16, !tbaa !0
177 %v111 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 25
178 store float %v109, ptr %v111, align 4, !tbaa !0
179 %v112 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 61
180 store float 1.000000e+00, ptr %v112, align 4, !tbaa !0
181 %v113 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 26
182 store float 1.000000e+00, ptr %v113, align 8, !tbaa !0
183 %v114 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 58
184 store float 0.000000e+00, ptr %v114, align 8, !tbaa !0
185 %v115 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 57
186 store float 0.000000e+00, ptr %v115, align 4, !tbaa !0
187 %v116 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 56
188 store float 0.000000e+00, ptr %v116, align 16, !tbaa !0
189 %v117 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 29
190 store float 0.000000e+00, ptr %v117, align 4, !tbaa !0
191 %v118 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 28
192 store float 0.000000e+00, ptr %v118, align 16, !tbaa !0
193 %v119 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 27
194 store float 0.000000e+00, ptr %v119, align 4, !tbaa !0
195 %v120 = load float, ptr %v104, align 4, !tbaa !0
196 %v121 = fmul float %v105, %v120
197 %v122 = fsub float -0.000000e+00, %v121
198 %v123 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 30
199 store float %v122, ptr %v123, align 8, !tbaa !0
200 %v124 = fmul float %v109, %v120
201 %v125 = fsub float -0.000000e+00, %v124
202 %v126 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 31
203 store float %v125, ptr %v126, align 4, !tbaa !0
204 %v127 = getelementptr inbounds float, ptr %a1, i32 7
205 %v128 = load float, ptr %v127, align 4, !tbaa !0
206 %v129 = fmul float %v105, %v128
207 %v130 = fsub float -0.000000e+00, %v129
208 %v131 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 62
209 store float %v130, ptr %v131, align 8, !tbaa !0
210 %v132 = fmul float %v109, %v128
211 %v133 = fsub float -0.000000e+00, %v132
212 %v134 = getelementptr inbounds [64 x float], ptr %v0, i32 0, i32 63
213 store float %v133, ptr %v134, align 4, !tbaa !0
214 %v135 = getelementptr inbounds [8 x float], ptr %v1, i32 0, i32 3
215 store float %v120, ptr %v135, align 4, !tbaa !0
216 %v136 = getelementptr inbounds [8 x float], ptr %v1, i32 0, i32 7
217 store float %v128, ptr %v136, align 4, !tbaa !0
218 %v137 = load ptr, ptr @g0, align 4, !tbaa !4
219 %v138 = load ptr, ptr %v137, align 4, !tbaa !4
220 call void %v138(ptr %v0, i32 8, i32 8, ptr %v1, ptr %a2) #2
221 %v139 = getelementptr inbounds float, ptr %a2, i32 8
222 store float 1.000000e+00, ptr %v139, align 4, !tbaa !0
223 call void @llvm.lifetime.end.p0(i64 256, ptr %v0) #2
227 ; Function Attrs: argmemonly nounwind
228 declare void @llvm.lifetime.start.p0(i64, ptr nocapture) #1
230 ; Function Attrs: argmemonly nounwind
231 declare void @llvm.lifetime.end.p0(i64, ptr nocapture) #1
233 attributes #0 = { nounwind "target-cpu"="hexagonv55" }
234 attributes #1 = { argmemonly nounwind }
235 attributes #2 = { nounwind }
237 !0 = !{!1, !1, i64 0}
239 !2 = !{!"omnipotent char", !3}
240 !3 = !{!"Simple C/C++ TBAA"}
241 !4 = !{!5, !5, i64 0}
242 !5 = !{!"any pointer", !2}