1 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2 ; RUN: llc --mtriple=loongarch64 --mattr=+lsx < %s | FileCheck %s
4 define void @mulhs_v16i8(ptr %res, ptr %a0, ptr %a1) nounwind {
5 ; CHECK-LABEL: mulhs_v16i8:
6 ; CHECK: # %bb.0: # %entry
7 ; CHECK-NEXT: vld $vr0, $a1, 0
8 ; CHECK-NEXT: vld $vr1, $a2, 0
9 ; CHECK-NEXT: vmuh.b $vr0, $vr0, $vr1
10 ; CHECK-NEXT: vst $vr0, $a0, 0
13 %v0 = load <16 x i8>, ptr %a0
14 %v1 = load <16 x i8>, ptr %a1
15 %v0s = sext <16 x i8> %v0 to <16 x i16>
16 %v1s = sext <16 x i8> %v1 to <16 x i16>
17 %m = mul <16 x i16> %v0s, %v1s
18 %s = ashr <16 x i16> %m, <i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8>
19 %v2 = trunc <16 x i16> %s to <16 x i8>
20 store <16 x i8> %v2, ptr %res
24 define void @mulhu_v16i8(ptr %res, ptr %a0, ptr %a1) nounwind {
25 ; CHECK-LABEL: mulhu_v16i8:
26 ; CHECK: # %bb.0: # %entry
27 ; CHECK-NEXT: vld $vr0, $a1, 0
28 ; CHECK-NEXT: vld $vr1, $a2, 0
29 ; CHECK-NEXT: vmuh.bu $vr0, $vr0, $vr1
30 ; CHECK-NEXT: vst $vr0, $a0, 0
33 %v0 = load <16 x i8>, ptr %a0
34 %v1 = load <16 x i8>, ptr %a1
35 %v0z = zext <16 x i8> %v0 to <16 x i16>
36 %v1z = zext <16 x i8> %v1 to <16 x i16>
37 %m = mul <16 x i16> %v0z, %v1z
38 %s = lshr <16 x i16> %m, <i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8, i16 8>
39 %v2 = trunc <16 x i16> %s to <16 x i8>
40 store <16 x i8> %v2, ptr %res
44 define void @mulhs_v8i16(ptr %res, ptr %a0, ptr %a1) nounwind {
45 ; CHECK-LABEL: mulhs_v8i16:
46 ; CHECK: # %bb.0: # %entry
47 ; CHECK-NEXT: vld $vr0, $a1, 0
48 ; CHECK-NEXT: vld $vr1, $a2, 0
49 ; CHECK-NEXT: vmuh.h $vr0, $vr0, $vr1
50 ; CHECK-NEXT: vst $vr0, $a0, 0
53 %v0 = load <8 x i16>, ptr %a0
54 %v1 = load <8 x i16>, ptr %a1
55 %v0s = sext <8 x i16> %v0 to <8 x i32>
56 %v1s = sext <8 x i16> %v1 to <8 x i32>
57 %m = mul <8 x i32> %v0s, %v1s
58 %s = ashr <8 x i32> %m, <i32 16, i32 16, i32 16, i32 16, i32 16, i32 16, i32 16, i32 16>
59 %v2 = trunc <8 x i32> %s to <8 x i16>
60 store <8 x i16> %v2, ptr %res
64 define void @mulhu_v8i16(ptr %res, ptr %a0, ptr %a1) nounwind {
65 ; CHECK-LABEL: mulhu_v8i16:
66 ; CHECK: # %bb.0: # %entry
67 ; CHECK-NEXT: vld $vr0, $a1, 0
68 ; CHECK-NEXT: vld $vr1, $a2, 0
69 ; CHECK-NEXT: vmuh.hu $vr0, $vr0, $vr1
70 ; CHECK-NEXT: vst $vr0, $a0, 0
73 %v0 = load <8 x i16>, ptr %a0
74 %v1 = load <8 x i16>, ptr %a1
75 %v0z = zext <8 x i16> %v0 to <8 x i32>
76 %v1z = zext <8 x i16> %v1 to <8 x i32>
77 %m = mul <8 x i32> %v0z, %v1z
78 %s = lshr <8 x i32> %m, <i32 16, i32 16, i32 16, i32 16, i32 16, i32 16, i32 16, i32 16>
79 %v2 = trunc <8 x i32> %s to <8 x i16>
80 store <8 x i16> %v2, ptr %res
84 define void @mulhs_v4i32(ptr %res, ptr %a0, ptr %a1) nounwind {
85 ; CHECK-LABEL: mulhs_v4i32:
86 ; CHECK: # %bb.0: # %entry
87 ; CHECK-NEXT: vld $vr0, $a1, 0
88 ; CHECK-NEXT: vld $vr1, $a2, 0
89 ; CHECK-NEXT: vmuh.w $vr0, $vr0, $vr1
90 ; CHECK-NEXT: vst $vr0, $a0, 0
93 %v0 = load <4 x i32>, ptr %a0
94 %v1 = load <4 x i32>, ptr %a1
95 %v0s = sext <4 x i32> %v0 to <4 x i64>
96 %v1s = sext <4 x i32> %v1 to <4 x i64>
97 %m = mul <4 x i64> %v0s, %v1s
98 %s = ashr <4 x i64> %m, <i64 32, i64 32, i64 32, i64 32>
99 %v2 = trunc <4 x i64> %s to <4 x i32>
100 store <4 x i32> %v2, ptr %res
104 define void @mulhu_v4i32(ptr %res, ptr %a0, ptr %a1) nounwind {
105 ; CHECK-LABEL: mulhu_v4i32:
106 ; CHECK: # %bb.0: # %entry
107 ; CHECK-NEXT: vld $vr0, $a1, 0
108 ; CHECK-NEXT: vld $vr1, $a2, 0
109 ; CHECK-NEXT: vmuh.wu $vr0, $vr0, $vr1
110 ; CHECK-NEXT: vst $vr0, $a0, 0
113 %v0 = load <4 x i32>, ptr %a0
114 %v1 = load <4 x i32>, ptr %a1
115 %v0z = zext <4 x i32> %v0 to <4 x i64>
116 %v1z = zext <4 x i32> %v1 to <4 x i64>
117 %m = mul <4 x i64> %v0z, %v1z
118 %s = lshr <4 x i64> %m, <i64 32, i64 32, i64 32, i64 32>
119 %v2 = trunc <4 x i64> %s to <4 x i32>
120 store <4 x i32> %v2, ptr %res
124 define void @mulhs_v2i64(ptr %res, ptr %a0, ptr %a1) nounwind {
125 ; CHECK-LABEL: mulhs_v2i64:
126 ; CHECK: # %bb.0: # %entry
127 ; CHECK-NEXT: vld $vr0, $a1, 0
128 ; CHECK-NEXT: vld $vr1, $a2, 0
129 ; CHECK-NEXT: vmuh.d $vr0, $vr0, $vr1
130 ; CHECK-NEXT: vst $vr0, $a0, 0
133 %v0 = load <2 x i64>, ptr %a0
134 %v1 = load <2 x i64>, ptr %a1
135 %v0s = sext <2 x i64> %v0 to <2 x i128>
136 %v1s = sext <2 x i64> %v1 to <2 x i128>
137 %m = mul <2 x i128> %v0s, %v1s
138 %s = ashr <2 x i128> %m, <i128 64, i128 64>
139 %v2 = trunc <2 x i128> %s to <2 x i64>
140 store <2 x i64> %v2, ptr %res
144 define void @mulhu_v2i64(ptr %res, ptr %a0, ptr %a1) nounwind {
145 ; CHECK-LABEL: mulhu_v2i64:
146 ; CHECK: # %bb.0: # %entry
147 ; CHECK-NEXT: vld $vr0, $a1, 0
148 ; CHECK-NEXT: vld $vr1, $a2, 0
149 ; CHECK-NEXT: vmuh.du $vr0, $vr0, $vr1
150 ; CHECK-NEXT: vst $vr0, $a0, 0
153 %v0 = load <2 x i64>, ptr %a0
154 %v1 = load <2 x i64>, ptr %a1
155 %v0z = zext <2 x i64> %v0 to <2 x i128>
156 %v1z = zext <2 x i64> %v1 to <2 x i128>
157 %m = mul <2 x i128> %v0z, %v1z
158 %s = lshr <2 x i128> %m, <i128 64, i128 64>
159 %v2 = trunc <2 x i128> %s to <2 x i64>
160 store <2 x i64> %v2, ptr %res