Run DCE after a LoopFlatten test to reduce spurious output [nfc]
[llvm-project.git] / clang / test / CodeGenOpenCL / preserve_vec3.cl
blob19f0cdff60a9d6d141206259ad9c897428043f5c
1 // RUN: %clang_cc1 %s -emit-llvm -o - -triple spir-unknown-unknown -fpreserve-vec3-type | FileCheck %s
// The driver line above emits LLVM IR for the spir-unknown-unknown triple with
// -fpreserve-vec3-type and pipes that IR into FileCheck, which matches it
// against the directive comments placed inside each function below.

// Vector aliases used by the tests, declared with the ext_vector_type
// attribute; the attribute argument is the element count.
3 typedef char char3 __attribute__((ext_vector_type(3)));
4 typedef char char8 __attribute__((ext_vector_type(8)));
5 typedef short short3 __attribute__((ext_vector_type(3)));
6 typedef double double2 __attribute__((ext_vector_type(2)));
7 typedef float float3 __attribute__((ext_vector_type(3)));
8 typedef float float4 __attribute__((ext_vector_type(4)));
// Plain float3 copy from *a to *b.
// Expected IR: both the load from %a and the store to %b use <3 x float>,
// i.e. the three-element vector type appears unchanged in the memory accesses.
10 void kernel foo(global float3 *a, global float3 *b) {
11 // CHECK-LABEL: spir_kernel void @foo
12 // CHECK: %[[LOAD_A:.*]] = load <3 x float>, ptr addrspace(1) %a
13 // CHECK: store <3 x float> %[[LOAD_A]], ptr addrspace(1) %b
14 *b = *a;
// Reinterprets the float4 at *b as a float3 via __builtin_astype and stores it
// to *a.
// Expected IR: a 16-byte-aligned <4 x float> load from %b, a shufflevector that
// keeps lanes 0, 1 and 2, then a <3 x float> store to %a.
17 void kernel float4_to_float3(global float3 *a, global float4 *b) {
18 // CHECK-LABEL: spir_kernel void @float4_to_float3
19 // CHECK: %[[LOAD_A:.*]] = load <4 x float>, ptr addrspace(1) %b, align 16
20 // CHECK: %[[ASTYPE:.*]] = shufflevector <4 x float> %[[LOAD_A]], <4 x float> poison, <3 x i32> <i32 0, i32 1, i32 2>
21 // CHECK: store <3 x float> %[[ASTYPE]], ptr addrspace(1) %a, align 16
22 *a = __builtin_astype(*b, float3);
// Reinterprets the float3 at *a as a float4 via __builtin_astype and stores it
// to *b.
// Expected IR: a <3 x float> load from %a, a shufflevector that widens to four
// lanes (lanes 0-2 copied, fourth lane poison), then a <4 x float> store to %b.
25 void kernel float3_to_float4(global float3 *a, global float4 *b) {
26 // CHECK-LABEL: spir_kernel void @float3_to_float4
27 // CHECK: %[[LOAD_A:.*]] = load <3 x float>, ptr addrspace(1) %a, align 16
28 // CHECK: %[[ASTYPE:.*]] = shufflevector <3 x float> %[[LOAD_A]], <3 x float> poison, <4 x i32> <i32 0, i32 1, i32 2, i32 poison>
29 // CHECK: store <4 x float> %[[ASTYPE]], ptr addrspace(1) %b, align 16
30 *b = __builtin_astype(*a, float4);
// Reinterprets the float3 at *a as a double2 via __builtin_astype and stores it
// to *b.
// Expected IR: the same sequence as the float3 -> float4 case; the value is
// widened to <4 x float> by a shufflevector (fourth lane poison) and the store
// to %b is written with the <4 x float> type rather than <2 x double>.
33 void kernel float3_to_double2(global float3 *a, global double2 *b) {
34 // CHECK-LABEL: spir_kernel void @float3_to_double2
35 // CHECK: %[[LOAD_A:.*]] = load <3 x float>, ptr addrspace(1) %a, align 16
36 // CHECK: %[[ASTYPE:.*]] = shufflevector <3 x float> %[[LOAD_A]], <3 x float> poison, <4 x i32> <i32 0, i32 1, i32 2, i32 poison>
37 // CHECK: store <4 x float> %[[ASTYPE]], ptr addrspace(1) %b, align 16
38 *b = __builtin_astype(*a, double2);
// Reinterprets the char8 at *b as a short3 via __builtin_astype and stores it
// to *a.
// Expected IR: the source is loaded from %b directly as <4 x i16>, a
// shufflevector keeps lanes 0, 1 and 2, and the <3 x i16> result is stored to
// %a with 8-byte alignment.
41 void kernel char8_to_short3(global short3 *a, global char8 *b) {
42 // CHECK-LABEL: spir_kernel void @char8_to_short3
43 // CHECK: %[[LOAD_B:.*]] = load <4 x i16>, ptr addrspace(1) %b
44 // CHECK: %[[ASTYPE:.*]] = shufflevector <4 x i16> %[[LOAD_B]], <4 x i16> poison, <3 x i32> <i32 0, i32 1, i32 2>
45 // CHECK: store <3 x i16> %[[ASTYPE]], ptr addrspace(1) %a, align 8
46 *a = __builtin_astype(*b, short3);
// Non-kernel function: reinterprets a by-value char3 argument as an int via
// __builtin_astype and writes it through out.
// Expected IR: a shufflevector widens %a from <3 x i8> to <4 x i8> (fourth lane
// poison) and the store to %out is written with the <4 x i8> type.
49 void from_char3(char3 a, global int *out) {
50 // CHECK-LABEL: void @from_char3
51 // CHECK: %[[ASTYPE:.*]] = shufflevector <3 x i8> %a, <3 x i8> poison, <4 x i32> <i32 0, i32 1, i32 2, i32 poison>
52 // CHECK: store <4 x i8> %[[ASTYPE]], ptr addrspace(1) %out
53 *out = __builtin_astype(a, int);
// Non-kernel function: reinterprets a by-value short3 argument as a long via
// __builtin_astype and writes it through out.
// Expected IR: a shufflevector widens %a from <3 x i16> to <4 x i16> (fourth
// lane poison) and the store to %out is written with the <4 x i16> type.
56 void from_short3(short3 a, global long *out) {
57 // CHECK-LABEL: void @from_short3
58 // CHECK: %[[ASTYPE:.*]] = shufflevector <3 x i16> %a, <3 x i16> poison, <4 x i32> <i32 0, i32 1, i32 2, i32 poison>
59 // CHECK: store <4 x i16> %[[ASTYPE]], ptr addrspace(1) %out
60 *out = __builtin_astype(a, long);
// Non-kernel function: reinterprets an int argument as a char3 via
// __builtin_astype and writes it through out.
// Expected IR: %a is bitcast from i32 to <4 x i8>, a shufflevector keeps lanes
// 0, 1 and 2, and the <3 x i8> result is stored to %out.
63 void scalar_to_char3(int a, global char3 *out) {
64 // CHECK-LABEL: void @scalar_to_char3
65 // CHECK: %[[IN_BC:.*]] = bitcast i32 %a to <4 x i8>
66 // CHECK: %[[ASTYPE:.*]] = shufflevector <4 x i8> %[[IN_BC]], <4 x i8> poison, <3 x i32> <i32 0, i32 1, i32 2>
67 // CHECK: store <3 x i8> %[[ASTYPE]], ptr addrspace(1) %out
68 *out = __builtin_astype(a, char3);
// Non-kernel function: reinterprets a long argument as a short3 via
// __builtin_astype and writes it through out.
// Expected IR: %a is bitcast from i64 to <4 x i16>, a shufflevector keeps lanes
// 0, 1 and 2, and the <3 x i16> result is stored to %out.
71 void scalar_to_short3(long a, global short3 *out) {
72 // CHECK-LABEL: void @scalar_to_short3
73 // CHECK: %[[IN_BC:.*]] = bitcast i64 %a to <4 x i16>
74 // CHECK: %[[ASTYPE:.*]] = shufflevector <4 x i16> %[[IN_BC]], <4 x i16> poison, <3 x i32> <i32 0, i32 1, i32 2>
75 // CHECK: store <3 x i16> %[[ASTYPE]], ptr addrspace(1) %out
76 *out = __builtin_astype(a, short3);