1 ; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
2 ; RUN: opt < %s -passes=instcombine -S | FileCheck %s
4 define i32 @extractelement_in_range(<vscale x 4 x i32> %a) {
5 ; CHECK-LABEL: @extractelement_in_range(
6 ; CHECK-NEXT: [[R:%.*]] = extractelement <vscale x 4 x i32> [[A:%.*]], i64 1
7 ; CHECK-NEXT: ret i32 [[R]]
9 %r = extractelement <vscale x 4 x i32> %a, i64 1
13 define i32 @extractelement_maybe_out_of_range(<vscale x 4 x i32> %a) {
14 ; CHECK-LABEL: @extractelement_maybe_out_of_range(
15 ; CHECK-NEXT: [[R:%.*]] = extractelement <vscale x 4 x i32> [[A:%.*]], i64 4
16 ; CHECK-NEXT: ret i32 [[R]]
18 %r = extractelement <vscale x 4 x i32> %a, i64 4
22 define i32 @extractelement_bitcast(float %f) {
23 ; CHECK-LABEL: @extractelement_bitcast(
24 ; CHECK-NEXT: [[R:%.*]] = bitcast float [[F:%.*]] to i32
25 ; CHECK-NEXT: ret i32 [[R]]
27 %vec_float = insertelement <vscale x 4 x float> undef, float %f, i32 0
28 %vec_int = bitcast <vscale x 4 x float> %vec_float to <vscale x 4 x i32>
29 %r = extractelement <vscale x 4 x i32> %vec_int, i32 0
33 define i8 @extractelement_bitcast_to_trunc(<vscale x 2 x i32> %a, i32 %x) {
34 ; CHECK-LABEL: @extractelement_bitcast_to_trunc(
35 ; CHECK-NEXT: [[R:%.*]] = trunc i32 [[X:%.*]] to i8
36 ; CHECK-NEXT: ret i8 [[R]]
38 %vec = insertelement <vscale x 2 x i32> %a, i32 %x, i32 1
39 %vec_cast = bitcast <vscale x 2 x i32> %vec to <vscale x 8 x i8>
40 %r = extractelement <vscale x 8 x i8> %vec_cast, i32 4
44 define i8 @extractelement_bitcast_useless_insert(<vscale x 2 x i32> %a, i32 %x) {
45 ; CHECK-LABEL: @extractelement_bitcast_useless_insert(
46 ; CHECK-NEXT: [[TMP1:%.*]] = bitcast <vscale x 2 x i32> [[A:%.*]] to <vscale x 8 x i8>
47 ; CHECK-NEXT: [[R:%.*]] = extractelement <vscale x 8 x i8> [[TMP1]], i64 2
48 ; CHECK-NEXT: ret i8 [[R]]
50 %vec = insertelement <vscale x 2 x i32> %a, i32 %x, i32 1 ; <- This insert could be removed.
51 %vec_cast = bitcast <vscale x 2 x i32> %vec to <vscale x 8 x i8>
52 %r = extractelement <vscale x 8 x i8> %vec_cast, i32 2
56 define i32 @extractelement_shuffle_maybe_out_of_range(i32 %v) {
57 ; CHECK-LABEL: @extractelement_shuffle_maybe_out_of_range(
58 ; CHECK-NEXT: [[IN:%.*]] = insertelement <vscale x 4 x i32> undef, i32 [[V:%.*]], i64 0
59 ; CHECK-NEXT: [[SPLAT:%.*]] = shufflevector <vscale x 4 x i32> [[IN]], <vscale x 4 x i32> poison, <vscale x 4 x i32> zeroinitializer
60 ; CHECK-NEXT: [[R:%.*]] = extractelement <vscale x 4 x i32> [[SPLAT]], i64 4
61 ; CHECK-NEXT: ret i32 [[R]]
63 %in = insertelement <vscale x 4 x i32> undef, i32 %v, i32 0
64 %splat = shufflevector <vscale x 4 x i32> %in, <vscale x 4 x i32> undef, <vscale x 4 x i32> zeroinitializer
65 %r = extractelement <vscale x 4 x i32> %splat, i32 4
69 define i32 @extractelement_shuffle_invalid_index(i32 %v) {
70 ; CHECK-LABEL: @extractelement_shuffle_invalid_index(
71 ; CHECK-NEXT: [[IN:%.*]] = insertelement <vscale x 4 x i32> undef, i32 [[V:%.*]], i64 0
72 ; CHECK-NEXT: [[SPLAT:%.*]] = shufflevector <vscale x 4 x i32> [[IN]], <vscale x 4 x i32> poison, <vscale x 4 x i32> zeroinitializer
73 ; CHECK-NEXT: [[R:%.*]] = extractelement <vscale x 4 x i32> [[SPLAT]], i64 4294967295
74 ; CHECK-NEXT: ret i32 [[R]]
76 %in = insertelement <vscale x 4 x i32> undef, i32 %v, i32 0
77 %splat = shufflevector <vscale x 4 x i32> %in, <vscale x 4 x i32> undef, <vscale x 4 x i32> zeroinitializer
78 %r = extractelement <vscale x 4 x i32> %splat, i32 -1
82 define <vscale x 4 x i32> @extractelement_insertelement_same_positions(<vscale x 4 x i32> %vec) {
83 ; CHECK-LABEL: @extractelement_insertelement_same_positions(
84 ; CHECK-NEXT: ret <vscale x 4 x i32> [[VEC:%.*]]
86 %vec.e0 = extractelement <vscale x 4 x i32> %vec, i32 0
87 %vec.e1 = extractelement <vscale x 4 x i32> %vec, i32 1
88 %vec.e2 = extractelement <vscale x 4 x i32> %vec, i32 2
89 %vec.e3 = extractelement <vscale x 4 x i32> %vec, i32 3
90 %1 = insertelement <vscale x 4 x i32> %vec, i32 %vec.e0, i32 0
91 %2 = insertelement <vscale x 4 x i32> %1, i32 %vec.e1, i32 1
92 %3 = insertelement <vscale x 4 x i32> %2, i32 %vec.e2, i32 2
93 %4 = insertelement <vscale x 4 x i32> %3, i32 %vec.e3, i32 3
94 ret <vscale x 4 x i32> %4
97 define <vscale x 4 x i32> @extractelement_insertelement_diff_positions(<vscale x 4 x i32> %vec) {
98 ; CHECK-LABEL: @extractelement_insertelement_diff_positions(
99 ; CHECK-NEXT: [[VEC_E0:%.*]] = extractelement <vscale x 4 x i32> [[VEC:%.*]], i64 4
100 ; CHECK-NEXT: [[VEC_E1:%.*]] = extractelement <vscale x 4 x i32> [[VEC]], i64 5
101 ; CHECK-NEXT: [[VEC_E2:%.*]] = extractelement <vscale x 4 x i32> [[VEC]], i64 6
102 ; CHECK-NEXT: [[VEC_E3:%.*]] = extractelement <vscale x 4 x i32> [[VEC]], i64 7
103 ; CHECK-NEXT: [[TMP1:%.*]] = insertelement <vscale x 4 x i32> [[VEC]], i32 [[VEC_E0]], i64 0
104 ; CHECK-NEXT: [[TMP2:%.*]] = insertelement <vscale x 4 x i32> [[TMP1]], i32 [[VEC_E1]], i64 1
105 ; CHECK-NEXT: [[TMP3:%.*]] = insertelement <vscale x 4 x i32> [[TMP2]], i32 [[VEC_E2]], i64 2
106 ; CHECK-NEXT: [[TMP4:%.*]] = insertelement <vscale x 4 x i32> [[TMP3]], i32 [[VEC_E3]], i64 3
107 ; CHECK-NEXT: ret <vscale x 4 x i32> [[TMP4]]
109 %vec.e0 = extractelement <vscale x 4 x i32> %vec, i32 4
110 %vec.e1 = extractelement <vscale x 4 x i32> %vec, i32 5
111 %vec.e2 = extractelement <vscale x 4 x i32> %vec, i32 6
112 %vec.e3 = extractelement <vscale x 4 x i32> %vec, i32 7
113 %1 = insertelement <vscale x 4 x i32> %vec, i32 %vec.e0, i32 0
114 %2 = insertelement <vscale x 4 x i32> %1, i32 %vec.e1, i32 1
115 %3 = insertelement <vscale x 4 x i32> %2, i32 %vec.e2, i32 2
116 %4 = insertelement <vscale x 4 x i32> %3, i32 %vec.e3, i32 3
117 ret <vscale x 4 x i32> %4
120 define i32 @bitcast_of_extractelement( <vscale x 2 x float> %d) {
121 ; CHECK-LABEL: @bitcast_of_extractelement(
122 ; CHECK-NEXT: [[BC:%.*]] = bitcast <vscale x 2 x float> [[D:%.*]] to <vscale x 2 x i32>
123 ; CHECK-NEXT: [[CAST:%.*]] = extractelement <vscale x 2 x i32> [[BC]], i64 0
124 ; CHECK-NEXT: ret i32 [[CAST]]
126 %ext = extractelement <vscale x 2 x float> %d, i32 0
127 %cast = bitcast float %ext to i32
131 define i1 @extractelement_is_zero(<vscale x 2 x i32> %d, i1 %b, i32 %z) {
132 ; CHECK-LABEL: @extractelement_is_zero(
133 ; CHECK-NEXT: [[EXT:%.*]] = extractelement <vscale x 2 x i32> [[D:%.*]], i64 0
134 ; CHECK-NEXT: [[BB:%.*]] = icmp eq i32 [[EXT]], 0
135 ; CHECK-NEXT: ret i1 [[BB]]
137 %ext = extractelement <vscale x 2 x i32> %d, i32 0
138 %bb = icmp eq i32 %ext, 0
143 ; https://bugs.chromium.org/p/oss-fuzz/issues/detail?id=25272
144 define i32 @ossfuzz_25272(float %f) {
145 ; CHECK-LABEL: @ossfuzz_25272(
146 ; CHECK-NEXT: [[VEC_FLOAT:%.*]] = insertelement <vscale x 4 x float> undef, float [[F:%.*]], i64 0
147 ; CHECK-NEXT: [[VEC_INT:%.*]] = bitcast <vscale x 4 x float> [[VEC_FLOAT]] to <vscale x 4 x i32>
148 ; CHECK-NEXT: [[E:%.*]] = extractelement <vscale x 4 x i32> [[VEC_INT]], i64 2147483647
149 ; CHECK-NEXT: ret i32 [[E]]
151 %vec_float = insertelement <vscale x 4 x float> undef, float %f, i32 0
152 %vec_int = bitcast <vscale x 4 x float> %vec_float to <vscale x 4 x i32>
153 %E = extractelement <vscale x 4 x i32> %vec_int, i32 2147483647
157 ; Step vector optimization
159 define i64 @ext_lane0_from_stepvec() {
160 ; CHECK-LABEL: @ext_lane0_from_stepvec(
162 ; CHECK-NEXT: ret i64 0
165 %0 = call <vscale x 4 x i64> @llvm.stepvector.nxv4i64()
166 %1 = extractelement <vscale x 4 x i64> %0, i32 0
170 define i32 @ext_lane3_from_stepvec() {
171 ; CHECK-LABEL: @ext_lane3_from_stepvec(
173 ; CHECK-NEXT: ret i32 3
176 %0 = call <vscale x 4 x i32> @llvm.stepvector.nxv4i32()
177 %1 = extractelement <vscale x 4 x i32> %0, i64 3
181 define i64 @ext_lane_out_of_range_from_stepvec() {
182 ; CHECK-LABEL: @ext_lane_out_of_range_from_stepvec(
184 ; CHECK-NEXT: [[TMP0:%.*]] = call <vscale x 4 x i64> @llvm.stepvector.nxv4i64()
185 ; CHECK-NEXT: [[TMP1:%.*]] = extractelement <vscale x 4 x i64> [[TMP0]], i64 4
186 ; CHECK-NEXT: ret i64 [[TMP1]]
189 %0 = call <vscale x 4 x i64> @llvm.stepvector.nxv4i64()
190 %1 = extractelement <vscale x 4 x i64> %0, i32 4
194 define i64 @ext_lane_invalid_from_stepvec() {
195 ; CHECK-LABEL: @ext_lane_invalid_from_stepvec(
197 ; CHECK-NEXT: [[TMP0:%.*]] = call <vscale x 4 x i64> @llvm.stepvector.nxv4i64()
198 ; CHECK-NEXT: [[TMP1:%.*]] = extractelement <vscale x 4 x i64> [[TMP0]], i64 4294967295
199 ; CHECK-NEXT: ret i64 [[TMP1]]
202 %0 = call <vscale x 4 x i64> @llvm.stepvector.nxv4i64()
203 %1 = extractelement <vscale x 4 x i64> %0, i32 -1
207 define i64 @ext_lane_unknown_from_stepvec(i32 %v) {
208 ; CHECK-LABEL: @ext_lane_unknown_from_stepvec(
210 ; CHECK-NEXT: [[TMP0:%.*]] = call <vscale x 4 x i64> @llvm.stepvector.nxv4i64()
211 ; CHECK-NEXT: [[TMP1:%.*]] = extractelement <vscale x 4 x i64> [[TMP0]], i32 [[V:%.*]]
212 ; CHECK-NEXT: ret i64 [[TMP1]]
215 %0 = call <vscale x 4 x i64> @llvm.stepvector.nxv4i64()
216 %1 = extractelement <vscale x 4 x i64> %0, i32 %v
220 ; Check that poison is returned when the extracted element has wrapped.
222 define i8 @ext_lane256_from_stepvec() {
223 ; CHECK-LABEL: @ext_lane256_from_stepvec(
225 ; CHECK-NEXT: ret i8 poison
228 %0 = call <vscale x 512 x i8> @llvm.stepvector.nxv512i8()
229 %1 = extractelement <vscale x 512 x i8> %0, i64 256
233 define i8 @ext_lane255_from_stepvec() {
234 ; CHECK-LABEL: @ext_lane255_from_stepvec(
236 ; CHECK-NEXT: ret i8 -1
239 %0 = call <vscale x 512 x i8> @llvm.stepvector.nxv512i8()
240 %1 = extractelement <vscale x 512 x i8> %0, i64 255
244 ; Check that we can extract more complex cases where the stepvector is
245 ; involved in a binary operation prior to the lane being extracted.
247 define i64 @ext_lane0_from_add_with_stepvec(i64 %i) {
248 ; CHECK-LABEL: @ext_lane0_from_add_with_stepvec(
249 ; CHECK-NEXT: ret i64 [[I:%.*]]
251 %tmp = insertelement <vscale x 2 x i64> poison, i64 %i, i32 0
252 %splatofi = shufflevector <vscale x 2 x i64> %tmp, <vscale x 2 x i64> poison, <vscale x 2 x i32> zeroinitializer
253 %stepvec = call <vscale x 2 x i64> @llvm.stepvector.nxv2i64()
254 %add = add <vscale x 2 x i64> %splatofi, %stepvec
255 %res = extractelement <vscale x 2 x i64> %add, i32 0
259 define i1 @ext_lane1_from_cmp_with_stepvec(i64 %i) {
260 ; CHECK-LABEL: @ext_lane1_from_cmp_with_stepvec(
261 ; CHECK-NEXT: [[RES:%.*]] = icmp eq i64 [[I:%.*]], 1
262 ; CHECK-NEXT: ret i1 [[RES]]
264 %tmp = insertelement <vscale x 2 x i64> poison, i64 %i, i32 0
265 %splatofi = shufflevector <vscale x 2 x i64> %tmp, <vscale x 2 x i64> poison, <vscale x 2 x i32> zeroinitializer
266 %stepvec = call <vscale x 2 x i64> @llvm.stepvector.nxv2i64()
267 %cmp = icmp eq <vscale x 2 x i64> %splatofi, %stepvec
268 %res = extractelement <vscale x 2 x i1> %cmp, i32 1
272 define ptr @ext_lane_from_bitcast_of_splat(ptr %v) {
273 ; CHECK-LABEL: @ext_lane_from_bitcast_of_splat(
275 ; CHECK-NEXT: ret ptr [[V:%.*]]
278 %in = insertelement <vscale x 4 x ptr> poison, ptr %v, i32 0
279 %splat = shufflevector <vscale x 4 x ptr> %in, <vscale x 4 x ptr> poison, <vscale x 4 x i32> zeroinitializer
280 %bc = bitcast <vscale x 4 x ptr> %splat to <vscale x 4 x ptr>
281 %r = extractelement <vscale x 4 x ptr> %bc, i32 3
285 declare <vscale x 2 x i64> @llvm.stepvector.nxv2i64()
286 declare <vscale x 4 x i64> @llvm.stepvector.nxv4i64()
287 declare <vscale x 4 x i32> @llvm.stepvector.nxv4i32()
288 declare <vscale x 512 x i8> @llvm.stepvector.nxv512i8()