1 // NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py
2 // REQUIRES: aarch64-registered-target
3 // RUN: %clang_cc1 -fclang-abi-compat=latest -triple aarch64-none-linux-gnu \
4 // RUN: -target-feature +sve2p1 -S -O1 -Werror -emit-llvm -o - %s | FileCheck %s
5 // RUN: %clang_cc1 -fclang-abi-compat=latest -triple aarch64-none-linux-gnu \
6 // RUN: -target-feature +sve2p1 -S -O1 -Werror -emit-llvm -o - -x c++ %s | FileCheck %s -check-prefix=CPP-CHECK
7 // RUN: %clang_cc1 -fclang-abi-compat=latest -triple aarch64-none-linux-gnu -target-feature +sve2p1 -S -disable-O0-optnone -Werror -Wall -o /dev/null %s
8 // RUN: %clang_cc1 -fclang-abi-compat=latest -triple aarch64-none-linux-gnu \
9 // RUN: -target-feature +sve2p1 -S -O1 -Werror -emit-llvm -o - %s | FileCheck %s
10 // RUN: %clang_cc1 -fclang-abi-compat=latest -triple aarch64-none-linux-gnu \
11 // RUN: -target-feature +sve2p1 -S -O1 -Werror -emit-llvm -o - -x c++ %s | FileCheck %s -check-prefix=CPP-CHECK
12 // RUN: %clang_cc1 -fclang-abi-compat=latest -triple aarch64-none-linux-gnu -target-feature +sve2p1 -S -disable-O0-optnone -Werror -Wall -o /dev/null %s
16 // CHECK-LABEL: @test_svpsel_lane_b8(
18 // CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 15
19 // CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv16i1(<vscale x 16 x i1> [[P1:%.*]], <vscale x 16 x i1> [[P2:%.*]], i32 [[ADD]])
20 // CHECK-NEXT: ret <vscale x 16 x i1> [[TMP0]]
22 // CPP-CHECK-LABEL: @_Z19test_svpsel_lane_b8u10__SVBool_tS_j(
23 // CPP-CHECK-NEXT: entry:
24 // CPP-CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 15
25 // CPP-CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv16i1(<vscale x 16 x i1> [[P1:%.*]], <vscale x 16 x i1> [[P2:%.*]], i32 [[ADD]])
26 // CPP-CHECK-NEXT: ret <vscale x 16 x i1> [[TMP0]]
28 svbool_t
test_svpsel_lane_b8(svbool_t p1
, svbool_t p2
, uint32_t idx
) __arm_streaming_compatible
{
29 return svpsel_lane_b8(p1
, p2
, idx
+ 15);
32 // CHECK-LABEL: @test_svpsel_lane_b16(
34 // CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 7
35 // CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 8 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv8i1(<vscale x 16 x i1> [[P2:%.*]])
36 // CHECK-NEXT: [[TMP1:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv8i1(<vscale x 16 x i1> [[P1:%.*]], <vscale x 8 x i1> [[TMP0]], i32 [[ADD]])
37 // CHECK-NEXT: ret <vscale x 16 x i1> [[TMP1]]
39 // CPP-CHECK-LABEL: @_Z20test_svpsel_lane_b16u10__SVBool_tS_j(
40 // CPP-CHECK-NEXT: entry:
41 // CPP-CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 7
42 // CPP-CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 8 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv8i1(<vscale x 16 x i1> [[P2:%.*]])
43 // CPP-CHECK-NEXT: [[TMP1:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv8i1(<vscale x 16 x i1> [[P1:%.*]], <vscale x 8 x i1> [[TMP0]], i32 [[ADD]])
44 // CPP-CHECK-NEXT: ret <vscale x 16 x i1> [[TMP1]]
46 svbool_t
test_svpsel_lane_b16(svbool_t p1
, svbool_t p2
, uint32_t idx
) __arm_streaming_compatible
{
47 return svpsel_lane_b16(p1
, p2
, idx
+ 7);
50 // CHECK-LABEL: @test_svpsel_lane_b32(
52 // CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 3
53 // CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 4 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv4i1(<vscale x 16 x i1> [[P2:%.*]])
54 // CHECK-NEXT: [[TMP1:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv4i1(<vscale x 16 x i1> [[P1:%.*]], <vscale x 4 x i1> [[TMP0]], i32 [[ADD]])
55 // CHECK-NEXT: ret <vscale x 16 x i1> [[TMP1]]
57 // CPP-CHECK-LABEL: @_Z20test_svpsel_lane_b32u10__SVBool_tS_j(
58 // CPP-CHECK-NEXT: entry:
59 // CPP-CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 3
60 // CPP-CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 4 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv4i1(<vscale x 16 x i1> [[P2:%.*]])
61 // CPP-CHECK-NEXT: [[TMP1:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv4i1(<vscale x 16 x i1> [[P1:%.*]], <vscale x 4 x i1> [[TMP0]], i32 [[ADD]])
62 // CPP-CHECK-NEXT: ret <vscale x 16 x i1> [[TMP1]]
64 svbool_t
test_svpsel_lane_b32(svbool_t p1
, svbool_t p2
, uint32_t idx
) __arm_streaming_compatible
{
65 return svpsel_lane_b32(p1
, p2
, idx
+ 3);
68 // CHECK-LABEL: @test_svpsel_lane_b64(
70 // CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 1
71 // CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 2 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv2i1(<vscale x 16 x i1> [[P2:%.*]])
72 // CHECK-NEXT: [[TMP1:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv2i1(<vscale x 16 x i1> [[P1:%.*]], <vscale x 2 x i1> [[TMP0]], i32 [[ADD]])
73 // CHECK-NEXT: ret <vscale x 16 x i1> [[TMP1]]
75 // CPP-CHECK-LABEL: @_Z20test_svpsel_lane_b64u10__SVBool_tS_j(
76 // CPP-CHECK-NEXT: entry:
77 // CPP-CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 1
78 // CPP-CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 2 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv2i1(<vscale x 16 x i1> [[P2:%.*]])
79 // CPP-CHECK-NEXT: [[TMP1:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv2i1(<vscale x 16 x i1> [[P1:%.*]], <vscale x 2 x i1> [[TMP0]], i32 [[ADD]])
80 // CPP-CHECK-NEXT: ret <vscale x 16 x i1> [[TMP1]]
82 svbool_t
test_svpsel_lane_b64(svbool_t p1
, svbool_t p2
, uint32_t idx
) __arm_streaming_compatible
{
83 return svpsel_lane_b64(p1
, p2
, idx
+ 1);
86 // CHECK-LABEL: @test_svpsel_lane_c8(
88 // CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 15
89 // CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.convert.to.svbool.taarch64.svcountt(target("aarch64.svcount") [[P1:%.*]])
90 // CHECK-NEXT: [[TMP1:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv16i1(<vscale x 16 x i1> [[TMP0]], <vscale x 16 x i1> [[P2:%.*]], i32 [[ADD]])
91 // CHECK-NEXT: [[TMP2:%.*]] = tail call target("aarch64.svcount") @llvm.aarch64.sve.convert.from.svbool.taarch64.svcountt(<vscale x 16 x i1> [[TMP1]])
92 // CHECK-NEXT: ret target("aarch64.svcount") [[TMP2]]
94 // CPP-CHECK-LABEL: @_Z19test_svpsel_lane_c8u11__SVCount_tu10__SVBool_tj(
95 // CPP-CHECK-NEXT: entry:
96 // CPP-CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 15
97 // CPP-CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.convert.to.svbool.taarch64.svcountt(target("aarch64.svcount") [[P1:%.*]])
98 // CPP-CHECK-NEXT: [[TMP1:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv16i1(<vscale x 16 x i1> [[TMP0]], <vscale x 16 x i1> [[P2:%.*]], i32 [[ADD]])
99 // CPP-CHECK-NEXT: [[TMP2:%.*]] = tail call target("aarch64.svcount") @llvm.aarch64.sve.convert.from.svbool.taarch64.svcountt(<vscale x 16 x i1> [[TMP1]])
100 // CPP-CHECK-NEXT: ret target("aarch64.svcount") [[TMP2]]
102 svcount_t
test_svpsel_lane_c8(svcount_t p1
, svbool_t p2
, uint32_t idx
) __arm_streaming_compatible
{
103 return svpsel_lane_c8(p1
, p2
, idx
+ 15);
106 // CHECK-LABEL: @test_svpsel_lane_c16(
107 // CHECK-NEXT: entry:
108 // CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 7
109 // CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.convert.to.svbool.taarch64.svcountt(target("aarch64.svcount") [[P1:%.*]])
110 // CHECK-NEXT: [[TMP1:%.*]] = tail call <vscale x 8 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv8i1(<vscale x 16 x i1> [[P2:%.*]])
111 // CHECK-NEXT: [[TMP2:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv8i1(<vscale x 16 x i1> [[TMP0]], <vscale x 8 x i1> [[TMP1]], i32 [[ADD]])
112 // CHECK-NEXT: [[TMP3:%.*]] = tail call target("aarch64.svcount") @llvm.aarch64.sve.convert.from.svbool.taarch64.svcountt(<vscale x 16 x i1> [[TMP2]])
113 // CHECK-NEXT: ret target("aarch64.svcount") [[TMP3]]
115 // CPP-CHECK-LABEL: @_Z20test_svpsel_lane_c16u11__SVCount_tu10__SVBool_tj(
116 // CPP-CHECK-NEXT: entry:
117 // CPP-CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 7
118 // CPP-CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.convert.to.svbool.taarch64.svcountt(target("aarch64.svcount") [[P1:%.*]])
119 // CPP-CHECK-NEXT: [[TMP1:%.*]] = tail call <vscale x 8 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv8i1(<vscale x 16 x i1> [[P2:%.*]])
120 // CPP-CHECK-NEXT: [[TMP2:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv8i1(<vscale x 16 x i1> [[TMP0]], <vscale x 8 x i1> [[TMP1]], i32 [[ADD]])
121 // CPP-CHECK-NEXT: [[TMP3:%.*]] = tail call target("aarch64.svcount") @llvm.aarch64.sve.convert.from.svbool.taarch64.svcountt(<vscale x 16 x i1> [[TMP2]])
122 // CPP-CHECK-NEXT: ret target("aarch64.svcount") [[TMP3]]
124 svcount_t
test_svpsel_lane_c16(svcount_t p1
, svbool_t p2
, uint32_t idx
) __arm_streaming_compatible
{
125 return svpsel_lane_c16(p1
, p2
, idx
+ 7);
128 // CHECK-LABEL: @test_svpsel_lane_c32(
129 // CHECK-NEXT: entry:
130 // CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 3
131 // CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.convert.to.svbool.taarch64.svcountt(target("aarch64.svcount") [[P1:%.*]])
132 // CHECK-NEXT: [[TMP1:%.*]] = tail call <vscale x 4 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv4i1(<vscale x 16 x i1> [[P2:%.*]])
133 // CHECK-NEXT: [[TMP2:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv4i1(<vscale x 16 x i1> [[TMP0]], <vscale x 4 x i1> [[TMP1]], i32 [[ADD]])
134 // CHECK-NEXT: [[TMP3:%.*]] = tail call target("aarch64.svcount") @llvm.aarch64.sve.convert.from.svbool.taarch64.svcountt(<vscale x 16 x i1> [[TMP2]])
135 // CHECK-NEXT: ret target("aarch64.svcount") [[TMP3]]
137 // CPP-CHECK-LABEL: @_Z20test_svpsel_lane_c32u11__SVCount_tu10__SVBool_tj(
138 // CPP-CHECK-NEXT: entry:
139 // CPP-CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 3
140 // CPP-CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.convert.to.svbool.taarch64.svcountt(target("aarch64.svcount") [[P1:%.*]])
141 // CPP-CHECK-NEXT: [[TMP1:%.*]] = tail call <vscale x 4 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv4i1(<vscale x 16 x i1> [[P2:%.*]])
142 // CPP-CHECK-NEXT: [[TMP2:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv4i1(<vscale x 16 x i1> [[TMP0]], <vscale x 4 x i1> [[TMP1]], i32 [[ADD]])
143 // CPP-CHECK-NEXT: [[TMP3:%.*]] = tail call target("aarch64.svcount") @llvm.aarch64.sve.convert.from.svbool.taarch64.svcountt(<vscale x 16 x i1> [[TMP2]])
144 // CPP-CHECK-NEXT: ret target("aarch64.svcount") [[TMP3]]
146 svcount_t
test_svpsel_lane_c32(svcount_t p1
, svbool_t p2
, uint32_t idx
) __arm_streaming_compatible
{
147 return svpsel_lane_c32(p1
, p2
, idx
+ 3);
150 // CHECK-LABEL: @test_svpsel_lane_c64(
151 // CHECK-NEXT: entry:
152 // CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 1
153 // CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.convert.to.svbool.taarch64.svcountt(target("aarch64.svcount") [[P1:%.*]])
154 // CHECK-NEXT: [[TMP1:%.*]] = tail call <vscale x 2 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv2i1(<vscale x 16 x i1> [[P2:%.*]])
155 // CHECK-NEXT: [[TMP2:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv2i1(<vscale x 16 x i1> [[TMP0]], <vscale x 2 x i1> [[TMP1]], i32 [[ADD]])
156 // CHECK-NEXT: [[TMP3:%.*]] = tail call target("aarch64.svcount") @llvm.aarch64.sve.convert.from.svbool.taarch64.svcountt(<vscale x 16 x i1> [[TMP2]])
157 // CHECK-NEXT: ret target("aarch64.svcount") [[TMP3]]
159 // CPP-CHECK-LABEL: @_Z20test_svpsel_lane_c64u11__SVCount_tu10__SVBool_tj(
160 // CPP-CHECK-NEXT: entry:
161 // CPP-CHECK-NEXT: [[ADD:%.*]] = add i32 [[IDX:%.*]], 1
162 // CPP-CHECK-NEXT: [[TMP0:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.convert.to.svbool.taarch64.svcountt(target("aarch64.svcount") [[P1:%.*]])
163 // CPP-CHECK-NEXT: [[TMP1:%.*]] = tail call <vscale x 2 x i1> @llvm.aarch64.sve.convert.from.svbool.nxv2i1(<vscale x 16 x i1> [[P2:%.*]])
164 // CPP-CHECK-NEXT: [[TMP2:%.*]] = tail call <vscale x 16 x i1> @llvm.aarch64.sve.psel.nxv2i1(<vscale x 16 x i1> [[TMP0]], <vscale x 2 x i1> [[TMP1]], i32 [[ADD]])
165 // CPP-CHECK-NEXT: [[TMP3:%.*]] = tail call target("aarch64.svcount") @llvm.aarch64.sve.convert.from.svbool.taarch64.svcountt(<vscale x 16 x i1> [[TMP2]])
166 // CPP-CHECK-NEXT: ret target("aarch64.svcount") [[TMP3]]
168 svcount_t
test_svpsel_lane_c64(svcount_t p1
, svbool_t p2
, uint32_t idx
) __arm_streaming_compatible
{
169 return svpsel_lane_c64(p1
, p2
, idx
+ 1);