; Loop-vectorizer regression test: two functions with the same loop body are
; compiled under different attribute groups, and the vector type of the store
; in the output is verified for each of them.
;
; The command line below feeds this file to opt with only the loop-vectorize
; pass enabled, prints textual IR (-S) and pipes it into FileCheck, which reads
; its directives from this same file.
; NOTE(review): -force-target-instruction-cost=1 presumably replaces every
; target-provided instruction cost with 1 so the result does not depend on
; cost-table details -- confirm against the vectorizer's option documentation.
1 ; RUN: opt -S < %s -passes=loop-vectorize -force-target-instruction-cost=1 | FileCheck %s
; Data layout (leading "e" = little-endian) and triple select AArch64 Linux.
3 target datalayout = "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128-Fn32"
4 target triple = "aarch64-unknown-linux-gnu"
; Two zero-initialized global arrays of 32000 floats each, 64-byte aligned.
; The loops in this file read from both and write into @a.
6 @a = dso_local local_unnamed_addr global [32000 x float] zeroinitializer, align 64
7 @b = dso_local local_unnamed_addr global [32000 x float] zeroinitializer, align 64
; @NeoverseV2 is compiled with attribute group #0 (target-cpu "neoverse-v2",
; features +sve,+sve2,+v9a, vscale_range(1,16)). The FileCheck directives
; directly under the define line require a store of <4 x float>, i.e. a
; fixed-width vector store, to appear in the output for this function.
; NOTE(review): presumably this pins a CPU-specific preference for fixed-width
; over scalable vectors -- the reason is not stated in this file; confirm.
9 define void @NeoverseV2() #0 {
10 ; CHECK-LABEL: define void @NeoverseV2(
11 ; CHECK: store <4 x float>
; NOTE(review): the labels %entry, %for.body and %for.cond.cleanup used below
; are not defined in the visible lines, and neither is the closing brace --
; confirm they are present in the full file.
; Loop counter i: 0 when coming from %entry, otherwise the incremented value.
20 %indvars.iv = phi i64 [ 0, %entry ], [ %indvars.iv.next, %for.body ]
; Load a[i].
21 %arrayidx = getelementptr inbounds [32000 x float], ptr @a, i64 0, i64 %indvars.iv
22 %0 = load float, ptr %arrayidx, align 4
; Load b[i].
23 %arrayidx2 = getelementptr inbounds [32000 x float], ptr @b, i64 0, i64 %indvars.iv
24 %1 = load float, ptr %arrayidx2, align 4
; Sum the two loaded values with fast-math flags.
25 %add = fadd fast float %1, %0
; Store the sum to a[i + 16000]. With i running from 0 to 15999 the loads
; touch a[0..15999] while the stores touch a[16000..31999].
26 %2 = add nuw nsw i64 %indvars.iv, 16000
27 %arrayidx5 = getelementptr inbounds [32000 x float], ptr @a, i64 0, i64 %2
28 store float %add, ptr %arrayidx5, align 4
; Increment i and leave the loop once the incremented value equals 16000.
29 %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
30 %exitcond.not = icmp eq i64 %indvars.iv.next, 16000
31 br i1 %exitcond.not, label %for.cond.cleanup, label %for.body
; @GenericCPU is compiled with attribute group #1 (target-cpu "generic",
; features +sve,+v9a, vscale_range(1,16)). The FileCheck directives directly
; under the define line require a store of <vscale x 4 x float>, i.e. a
; scalable vector store, to appear in the output for this function.
; The visible instructions are the same as in @NeoverseV2; only the attribute
; group and the expected store type differ.
34 define void @GenericCPU() #1 {
35 ; CHECK-LABEL: define void @GenericCPU(
36 ; CHECK: store <vscale x 4 x float>
; NOTE(review): the labels %entry, %for.body and %for.cond.cleanup used below
; are not defined in the visible lines, and neither is the closing brace --
; confirm they are present in the full file.
; Loop counter i: 0 when coming from %entry, otherwise the incremented value.
45 %indvars.iv = phi i64 [ 0, %entry ], [ %indvars.iv.next, %for.body ]
; Load a[i].
46 %arrayidx = getelementptr inbounds [32000 x float], ptr @a, i64 0, i64 %indvars.iv
47 %0 = load float, ptr %arrayidx, align 4
; Load b[i].
48 %arrayidx2 = getelementptr inbounds [32000 x float], ptr @b, i64 0, i64 %indvars.iv
49 %1 = load float, ptr %arrayidx2, align 4
; Sum the two loaded values with fast-math flags.
50 %add = fadd fast float %1, %0
; Store the sum to a[i + 16000]. With i running from 0 to 15999 the loads
; touch a[0..15999] while the stores touch a[16000..31999].
51 %2 = add nuw nsw i64 %indvars.iv, 16000
52 %arrayidx5 = getelementptr inbounds [32000 x float], ptr @a, i64 0, i64 %2
53 store float %add, ptr %arrayidx5, align 4
; Increment i and leave the loop once the incremented value equals 16000.
54 %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
55 %exitcond.not = icmp eq i64 %indvars.iv.next, 16000
56 br i1 %exitcond.not, label %for.cond.cleanup, label %for.body
; Attribute groups selecting the CPU model for each test function. Both allow
; vscale between 1 and 16 and enable SVE with v9a; they differ in target-cpu
; and in that #0 additionally lists +sve2.
; #0 is attached to @NeoverseV2: Neoverse V2 CPU model.
59 attributes #0 = { vscale_range(1,16) "target-cpu"="neoverse-v2" "target-features"="+sve,+sve2,+v9a" }
; #1 is attached to @GenericCPU: generic CPU model.
60 attributes #1 = { vscale_range(1,16) "target-cpu"="generic" "target-features"="+sve,+v9a" }