1 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 4
2 ; RUN: llc -mtriple=aarch64-linux -mattr=+neon,+fp8 < %s | FileCheck %s
4 define <8 x bfloat> @test_vbfcvtl1_low(<8 x i8> %vn) {
5 ; CHECK-LABEL: test_vbfcvtl1_low:
7 ; CHECK-NEXT: bf1cvtl v0.8h, v0.8b
9 %res = call <8 x bfloat> @llvm.aarch64.neon.fp8.cvtl1.v8bf16.v8i8(<8 x i8> %vn)
13 define <8 x bfloat> @test_vbfcvtl1_high(<16 x i8> %vn) {
14 ; CHECK-LABEL: test_vbfcvtl1_high:
16 ; CHECK-NEXT: bf1cvtl2 v0.8h, v0.16b
18 %res = call <8 x bfloat> @llvm.aarch64.neon.fp8.cvtl1.v8bf16.v16i8(<16 x i8> %vn)
22 define <8 x bfloat> @test_vbfcvtl2_low(<8 x i8> %vn) {
23 ; CHECK-LABEL: test_vbfcvtl2_low:
25 ; CHECK-NEXT: bf2cvtl v0.8h, v0.8b
27 %res = call <8 x bfloat> @llvm.aarch64.neon.fp8.cvtl2.v8bf16.v8i8(<8 x i8> %vn)
31 define <8 x bfloat> @test_vbfcvtl2_high(<16 x i8> %vn) {
32 ; CHECK-LABEL: test_vbfcvtl2_high:
34 ; CHECK-NEXT: bf2cvtl2 v0.8h, v0.16b
36 %res = call <8 x bfloat> @llvm.aarch64.neon.fp8.cvtl2.v8bf16.v16i8(<16 x i8> %vn)
41 define <8 x half> @test_vfcvtl1_low(<8 x i8> %vn) {
42 ; CHECK-LABEL: test_vfcvtl1_low:
44 ; CHECK-NEXT: f1cvtl v0.8h, v0.8b
46 %res = call <8 x half> @llvm.aarch64.neon.fp8.cvtl1.v8f16.v8i8(<8 x i8> %vn)
50 define <8 x half> @test_vfcvtl1_high(<16 x i8> %vn) {
51 ; CHECK-LABEL: test_vfcvtl1_high:
53 ; CHECK-NEXT: f1cvtl2 v0.8h, v0.16b
55 %res = call <8 x half> @llvm.aarch64.neon.fp8.cvtl1.v8f16.v16i8(<16 x i8> %vn)
59 define <8 x half> @test_vfcvtl2_low(<8 x i8> %vn) {
60 ; CHECK-LABEL: test_vfcvtl2_low:
62 ; CHECK-NEXT: f2cvtl v0.8h, v0.8b
64 %res = call <8 x half> @llvm.aarch64.neon.fp8.cvtl2.v8f16.v8i8(<8 x i8> %vn)
68 define <8 x half> @test_vfcvtl2_high(<16 x i8> %vn) {
69 ; CHECK-LABEL: test_vfcvtl2_high:
71 ; CHECK-NEXT: f2cvtl2 v0.8h, v0.16b
73 %res = call <8 x half> @llvm.aarch64.neon.fp8.cvtl2.v8f16.v16i8(<16 x i8> %vn)
77 define <8 x i8> @test_vcvtn_low_f8_f32(<4 x float> %vn, <4 x float> %vm) {
78 ; CHECK-LABEL: test_vcvtn_low_f8_f32:
80 ; CHECK-NEXT: fcvtn v0.8b, v0.4s, v1.4s
82 %res = call <8 x i8> @llvm.aarch64.neon.fp8.fcvtn.v8i8.v4f32(<4 x float> %vn, <4 x float> %vm)
86 define <16 x i8> @test_vcvtn_high_f8_f32(<16 x i8> %vd, <4 x float> %vn, <4 x float> %vm) {
87 ; CHECK-LABEL: test_vcvtn_high_f8_f32:
89 ; CHECK-NEXT: fcvtn2 v0.16b, v1.4s, v2.4s
91 %res = call <16 x i8> @llvm.aarch64.neon.fp8.fcvtn2.v16i8.v4f32(<16 x i8> %vd, <4 x float> %vn, <4 x float> %vm)
96 define <8 x i8> @test_vcvtn_f8_f16(<4 x half> %vn, <4 x half> %vm) {
97 ; CHECK-LABEL: test_vcvtn_f8_f16:
99 ; CHECK-NEXT: fcvtn v0.8b, v0.4h, v1.4h
101 %res = call <8 x i8> @llvm.aarch64.neon.fp8.fcvtn.v8i8.v4f16(<4 x half> %vn, <4 x half> %vm)
105 define <16 x i8> @test_vcvtn2_f8_f16(<8 x half> %vn, <8 x half> %vm) {
106 ; CHECK-LABEL: test_vcvtn2_f8_f16:
108 ; CHECK-NEXT: fcvtn v0.16b, v0.8h, v1.8h
110 %res = call <16 x i8> @llvm.aarch64.neon.fp8.fcvtn.v16i8.v8f16(<8 x half> %vn, <8 x half> %vm)