1 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=avx | FileCheck %s
4 ; @fptoui_zext is legal to optimize to a single vcvttps2dq: if one of the i8
5 ; results of fptoui is poisoned, the corresponding i32 result of the zext is
6 ; also poisoned. We currently don't implement this optimization.
8 define <16 x i8> @fptoui_zext(<4 x float> %arg) {
9 ; CHECK-LABEL: fptoui_zext:
11 ; CHECK-NEXT: vcvttps2dq %xmm0, %xmm0
12 ; CHECK-NEXT: vpackusdw %xmm0, %xmm0, %xmm0
13 ; CHECK-NEXT: vpackuswb %xmm0, %xmm0, %xmm0
14 ; CHECK-NEXT: vpmovzxbd {{.*#+}} xmm0 = xmm0[0],zero,zero,zero,xmm0[1],zero,zero,zero,xmm0[2],zero,zero,zero,xmm0[3],zero,zero,zero
16 %f = fptoui <4 x float> %arg to <4 x i8>
17 %z = zext <4 x i8> %f to <4 x i32>
18 %b = bitcast <4 x i32> %z to <16 x i8>
22 ; In @fptoui_shuffle, we must preserve the vpand (emitted as vandps below) for correctness. Only the
23 ; i8 values extracted from %s are poison. The values from the zeroinitializer
26 define <16 x i8> @fptoui_shuffle(<4 x float> %arg) {
27 ; CHECK-LABEL: fptoui_shuffle:
29 ; CHECK-NEXT: vcvttps2dq %xmm0, %xmm0
30 ; CHECK-NEXT: vandps {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
32 %f = fptoui <4 x float> %arg to <4 x i8>
33 %s = shufflevector <4 x i8> %f, <4 x i8> undef, <16 x i32> <i32 0, i32 1, i32 2, i32 3, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef, i32 undef>
34 %ss = shufflevector <16 x i8> %s, <16 x i8> zeroinitializer, <16 x i32> <i32 0, i32 17, i32 18, i32 19, i32 1, i32 21, i32 22, i32 23, i32 2, i32 25, i32 26, i32 27, i32 3, i32 29, i32 30, i32 31>