1 ; RUN: opt -loop-vectorize -force-vector-width=2 -S %s | FileCheck %s
3 ; Tests with alias sets that contain points with uncomputable bounds because
4 ; they include %offset.1, which is loaded in each loop iteration.
6 ; Alias set with uncomputable bounds contains a single load. We do not need
7 ; runtime checks for that group and it should not block vectorization.
8 define void @test1_uncomputable_bounds_single_load(i32* noalias %ptr.1, i32* noalias %ptr.2, i32* noalias %ptr.3, i64 %N, i64 %X) {
9 ; CHECK-LABEL: define void @test1_uncomputable_bounds_single_load
14 %cond = icmp sgt i64 %N, 0
15 br i1 %cond, label %ph, label %exit
21 %iv = phi i64 [ 0, %ph ], [ %iv.next, %loop ]
22 %gep.1 = getelementptr inbounds i32, i32* %ptr.3, i64 %iv
23 %offset.1 = load i32, i32* %gep.1, align 4
24 %gep.2 = getelementptr inbounds i32, i32* %ptr.2, i32 %offset.1
25 %lv = load i32, i32* %gep.2, align 4
26 %gep.3 = getelementptr inbounds i32, i32* %ptr.1, i64 %iv
27 store i32 %lv , i32* %gep.3, align 4
28 %offset.2 = add nsw i64 %iv, %X
29 %gep.4 = getelementptr inbounds i32, i32* %ptr.1, i64 %offset.2
30 store i32 %lv, i32* %gep.4, align 4
31 %iv.next = add nuw nsw i64 %iv, 1
32 %exitcond = icmp eq i64 %iv.next, %N
33 br i1 %exitcond, label %loop.exit, label %loop
42 ; Alias set with uncomputable bounds contains a single store. We do not need
43 ; runtime checks for that group and it should not block vectorization.
44 define void @test2_uncomputable_bounds_single_store(i32* noalias %ptr.1, i32* noalias %ptr.2, i32* noalias %ptr.3, i64 %N, i64 %X) {
45 ; CHECK-LABEL: define void @test2_uncomputable_bounds_single_store
50 %cond = icmp sgt i64 %N, 0
51 br i1 %cond, label %ph, label %exit
57 %iv = phi i64 [ 0, %ph ], [ %iv.next, %loop ]
58 %gep.1 = getelementptr inbounds i32, i32* %ptr.3, i64 %iv
59 %offset.1 = load i32, i32* %gep.1, align 4
60 %gep.2 = getelementptr inbounds i32, i32* %ptr.2, i32 %offset.1
61 store i32 20, i32* %gep.2, align 4
62 %gep.3 = getelementptr inbounds i32, i32* %ptr.1, i64 %iv
63 store i32 0 , i32* %gep.3, align 4
64 %offset.2 = add nsw i64 %iv, %X
65 %gep.4 = getelementptr inbounds i32, i32* %ptr.1, i64 %offset.2
66 store i32 10, i32* %gep.4, align 4
67 %iv.next = add nuw nsw i64 %iv, 1
68 %exitcond = icmp eq i64 %iv.next, %N
69 br i1 %exitcond, label %loop.exit, label %loop
78 ; Alias set with uncomputable bounds contains a load and a store. This blocks
79 ; vectorization, as we cannot generate runtime-checks for the set.
80 define void @test3_uncomputable_bounds_load_store(i32* noalias %ptr.1, i32* noalias %ptr.2, i32* noalias %ptr.3, i64 %N, i64 %X) {
81 ; CHECK-LABEL: define void @test3_uncomputable_bounds_load_store
82 ; CHECK-NOT: vector.body
85 %cond = icmp sgt i64 %N, 0
86 br i1 %cond, label %ph, label %exit
92 %iv = phi i64 [ 0, %ph ], [ %iv.next, %loop ]
93 %gep.1 = getelementptr inbounds i32, i32* %ptr.3, i64 %iv
94 %offset.1 = load i32, i32* %gep.1, align 4
95 %gep.2 = getelementptr inbounds i32, i32* %ptr.2, i32 %offset.1
96 store i32 20, i32* %gep.2, align 4
97 %gep.22 = getelementptr inbounds i32, i32* %ptr.2, i64 %iv
98 %lv = load i32, i32* %gep.22, align 4
99 %gep.3 = getelementptr inbounds i32, i32* %ptr.1, i64 %iv
100 store i32 %lv , i32* %gep.3, align 4
101 %offset.2 = add nsw i64 %iv, %X
102 %gep.4 = getelementptr inbounds i32, i32* %ptr.1, i64 %offset.2
103 store i32 %lv, i32* %gep.4, align 4
104 %iv.next = add nuw nsw i64 %iv, 1
105 %exitcond = icmp eq i64 %iv.next, %N
106 br i1 %exitcond, label %loop.exit, label %loop
115 ; Alias set with uncomputable bounds contains a load and a store. This blocks
116 ; vectorization, as we cannot generate runtime-checks for the set.
117 define void @test4_uncomputable_bounds_store_store(i32* noalias %ptr.1, i32* noalias %ptr.2, i32* noalias %ptr.3, i64 %N, i64 %X) {
118 ; CHECK-LABEL: define void @test4_uncomputable_bounds_store_store
119 ; CHECK-NOT: vector.body
122 %cond = icmp sgt i64 %N, 0
123 br i1 %cond, label %ph, label %exit
129 %iv = phi i64 [ 0, %ph ], [ %iv.next, %loop ]
130 %gep.1 = getelementptr inbounds i32, i32* %ptr.3, i64 %iv
131 %offset.1 = load i32, i32* %gep.1, align 4
132 %gep.2 = getelementptr inbounds i32, i32* %ptr.2, i32 %offset.1
133 store i32 20, i32* %gep.2, align 4
134 %gep.22 = getelementptr inbounds i32, i32* %ptr.2, i64 %iv
135 store i32 30, i32* %gep.22, align 4
136 %gep.3 = getelementptr inbounds i32, i32* %ptr.1, i64 %iv
137 store i32 0 , i32* %gep.3, align 4
138 %offset.2 = add nsw i64 %iv, %X
139 %gep.4 = getelementptr inbounds i32, i32* %ptr.1, i64 %offset.2
140 store i32 10, i32* %gep.4, align 4
141 %iv.next = add nuw nsw i64 %iv, 1
142 %exitcond = icmp eq i64 %iv.next, %N
143 br i1 %exitcond, label %loop.exit, label %loop