; RUN: opt -S -dxil-intrinsic-expansion < %s | FileCheck %s --check-prefix=CHECK
; RUN: opt -S -dxil-intrinsic-expansion -dxil-op-lower -mtriple=dxil-pc-shadermodel6.3-library < %s | FileCheck %s --check-prefix=CHECK

; Make sure the llvm.dx.step intrinsic is expanded into an fcmp olt + select
; sequence for half/float scalars and vectors.
\r
; Overloads of the llvm.dx.step intrinsic called by the test functions in this
; file: scalar plus 2-, 3- and 4-element vector forms.

; half overloads
declare half @llvm.dx.step.f16(half, half)
declare <2 x half> @llvm.dx.step.v2f16(<2 x half>, <2 x half>)
declare <3 x half> @llvm.dx.step.v3f16(<3 x half>, <3 x half>)
declare <4 x half> @llvm.dx.step.v4f16(<4 x half>, <4 x half>)

; float overloads
declare float @llvm.dx.step.f32(float, float)
declare <2 x float> @llvm.dx.step.v2f32(<2 x float>, <2 x float>)
declare <3 x float> @llvm.dx.step.v3f32(<3 x float>, <3 x float>)
declare <4 x float> @llvm.dx.step.v4f32(<4 x float>, <4 x float>)
\r
; Scalar half step: the expected expansion is an ordered less-than compare of
; %p1 against %p0 feeding a select that yields 0xH0000 (0.0) when the compare
; is true and 0xH3C00 (1.0) otherwise.
; CHECK-LABEL: @test_step_half(
define noundef half @test_step_half(half noundef %p0, half noundef %p1) {
; The entry block is named so that the unnamed instructions produced by the
; expansion are numbered starting at %0, as the checks below expect.
entry:
  ; CHECK: %0 = fcmp olt half %p1, %p0
  ; CHECK: %1 = select i1 %0, half 0xH0000, half 0xH3C00
  %hlsl.step = call half @llvm.dx.step.f16(half %p0, half %p1)
  ret half %hlsl.step
}
\r
; <2 x half> step: the expected expansion is an element-wise ordered less-than
; compare of %p1 against %p0 feeding a select between an all-zero vector and a
; splat of 0xH3C00 (1.0).
; CHECK-LABEL: @test_step_half2(
define noundef <2 x half> @test_step_half2(<2 x half> noundef %p0, <2 x half> noundef %p1) {
; The entry block is named so that the unnamed instructions produced by the
; expansion are numbered starting at %0, as the checks below expect.
entry:
  ; CHECK: %0 = fcmp olt <2 x half> %p1, %p0
  ; CHECK: %1 = select <2 x i1> %0, <2 x half> zeroinitializer, <2 x half> splat (half 0xH3C00)
  %hlsl.step = call <2 x half> @llvm.dx.step.v2f16(<2 x half> %p0, <2 x half> %p1)
  ret <2 x half> %hlsl.step
}
\r
; <3 x half> step: the expected expansion is an element-wise ordered less-than
; compare of %p1 against %p0 feeding a select between an all-zero vector and a
; splat of 0xH3C00 (1.0).
; CHECK-LABEL: @test_step_half3(
define noundef <3 x half> @test_step_half3(<3 x half> noundef %p0, <3 x half> noundef %p1) {
; The entry block is named so that the unnamed instructions produced by the
; expansion are numbered starting at %0, as the checks below expect.
entry:
  ; CHECK: %0 = fcmp olt <3 x half> %p1, %p0
  ; CHECK: %1 = select <3 x i1> %0, <3 x half> zeroinitializer, <3 x half> splat (half 0xH3C00)
  %hlsl.step = call <3 x half> @llvm.dx.step.v3f16(<3 x half> %p0, <3 x half> %p1)
  ret <3 x half> %hlsl.step
}
\r
; <4 x half> step: the expected expansion is an element-wise ordered less-than
; compare of %p1 against %p0 feeding a select between an all-zero vector and a
; splat of 0xH3C00 (1.0).
; CHECK-LABEL: @test_step_half4(
define noundef <4 x half> @test_step_half4(<4 x half> noundef %p0, <4 x half> noundef %p1) {
; The entry block is named so that the unnamed instructions produced by the
; expansion are numbered starting at %0, as the checks below expect.
entry:
  ; CHECK: %0 = fcmp olt <4 x half> %p1, %p0
  ; CHECK: %1 = select <4 x i1> %0, <4 x half> zeroinitializer, <4 x half> splat (half 0xH3C00)
  %hlsl.step = call <4 x half> @llvm.dx.step.v4f16(<4 x half> %p0, <4 x half> %p1)
  ret <4 x half> %hlsl.step
}
\r
; Scalar float step: the expected expansion is an ordered less-than compare of
; %p1 against %p0 feeding a select that yields 0.0 when the compare is true and
; 1.0 otherwise.
; CHECK-LABEL: @test_step_float(
define noundef float @test_step_float(float noundef %p0, float noundef %p1) {
; The entry block is named so that the unnamed instructions produced by the
; expansion are numbered starting at %0, as the checks below expect.
entry:
  ; CHECK: %0 = fcmp olt float %p1, %p0
  ; CHECK: %1 = select i1 %0, float 0.000000e+00, float 1.000000e+00
  %hlsl.step = call float @llvm.dx.step.f32(float %p0, float %p1)
  ret float %hlsl.step
}
\r
; <2 x float> step: the expected expansion is an element-wise ordered less-than
; compare of %p1 against %p0 feeding a select between an all-zero vector and a
; splat of 1.0.
; CHECK-LABEL: @test_step_float2(
define noundef <2 x float> @test_step_float2(<2 x float> noundef %p0, <2 x float> noundef %p1) {
; The entry block is named so that the unnamed instructions produced by the
; expansion are numbered starting at %0, as the checks below expect.
entry:
  ; CHECK: %0 = fcmp olt <2 x float> %p1, %p0
  ; CHECK: %1 = select <2 x i1> %0, <2 x float> zeroinitializer, <2 x float> splat (float 1.000000e+00)
  %hlsl.step = call <2 x float> @llvm.dx.step.v2f32(<2 x float> %p0, <2 x float> %p1)
  ret <2 x float> %hlsl.step
}
\r
; <3 x float> step: the expected expansion is an element-wise ordered less-than
; compare of %p1 against %p0 feeding a select between an all-zero vector and a
; splat of 1.0.
; CHECK-LABEL: @test_step_float3(
define noundef <3 x float> @test_step_float3(<3 x float> noundef %p0, <3 x float> noundef %p1) {
; The entry block is named so that the unnamed instructions produced by the
; expansion are numbered starting at %0, as the checks below expect.
entry:
  ; CHECK: %0 = fcmp olt <3 x float> %p1, %p0
  ; CHECK: %1 = select <3 x i1> %0, <3 x float> zeroinitializer, <3 x float> splat (float 1.000000e+00)
  %hlsl.step = call <3 x float> @llvm.dx.step.v3f32(<3 x float> %p0, <3 x float> %p1)
  ret <3 x float> %hlsl.step
}
\r
; <4 x float> step: the expected expansion is an element-wise ordered less-than
; compare of %p1 against %p0 feeding a select between an all-zero vector and a
; splat of 1.0.
; CHECK-LABEL: @test_step_float4(
define noundef <4 x float> @test_step_float4(<4 x float> noundef %p0, <4 x float> noundef %p1) {
; The entry block is named so that the unnamed instructions produced by the
; expansion are numbered starting at %0, as the checks below expect.
entry:
  ; CHECK: %0 = fcmp olt <4 x float> %p1, %p0
  ; CHECK: %1 = select <4 x i1> %0, <4 x float> zeroinitializer, <4 x float> splat (float 1.000000e+00)
  %hlsl.step = call <4 x float> @llvm.dx.step.v4f32(<4 x float> %p0, <4 x float> %p1)
  ret <4 x float> %hlsl.step
}
\r