; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s
; RUN: llc -march=amdgcn -mcpu=tonga -mattr=-flat-for-global -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s
; Scalar case: extending a float kernel argument to double is expected to
; select v_cvt_f64_f32_e32 with a VGPR range as destination and an SGPR as
; the source operand.
; FUNC-LABEL: {{^}}fpext_f32_to_f64:
; SI: v_cvt_f64_f32_e32 {{v\[[0-9]+:[0-9]+\]}}, s{{[0-9]+}}
define amdgpu_kernel void @fpext_f32_to_f64(double addrspace(1)* %out, float %in) {
  %result = fpext float %in to double
  store double %result, double addrspace(1)* %out
  ret void
}
; <2 x float> -> <2 x double>: the checks below expect a v_cvt_f64_f32_e32
; for each of the two elements.
; FUNC-LABEL: {{^}}fpext_v2f32_to_v2f64:
; SI: v_cvt_f64_f32_e32
; SI: v_cvt_f64_f32_e32
define amdgpu_kernel void @fpext_v2f32_to_v2f64(<2 x double> addrspace(1)* %out, <2 x float> %in) {
  %result = fpext <2 x float> %in to <2 x double>
  store <2 x double> %result, <2 x double> addrspace(1)* %out
  ret void
}
; <3 x float> -> <3 x double>: the checks below expect a v_cvt_f64_f32_e32
; for each of the three elements.
; FUNC-LABEL: {{^}}fpext_v3f32_to_v3f64:
; SI: v_cvt_f64_f32_e32
; SI: v_cvt_f64_f32_e32
; SI: v_cvt_f64_f32_e32
define amdgpu_kernel void @fpext_v3f32_to_v3f64(<3 x double> addrspace(1)* %out, <3 x float> %in) {
  %result = fpext <3 x float> %in to <3 x double>
  store <3 x double> %result, <3 x double> addrspace(1)* %out
  ret void
}
; <4 x float> -> <4 x double>: the checks below expect a v_cvt_f64_f32_e32
; for each of the four elements.
; FUNC-LABEL: {{^}}fpext_v4f32_to_v4f64:
; SI: v_cvt_f64_f32_e32
; SI: v_cvt_f64_f32_e32
; SI: v_cvt_f64_f32_e32
; SI: v_cvt_f64_f32_e32
define amdgpu_kernel void @fpext_v4f32_to_v4f64(<4 x double> addrspace(1)* %out, <4 x float> %in) {
  %result = fpext <4 x float> %in to <4 x double>
  store <4 x double> %result, <4 x double> addrspace(1)* %out
  ret void
}
; <8 x float> -> <8 x double>: the checks below expect a v_cvt_f64_f32_e32
; for each of the eight elements.
; FUNC-LABEL: {{^}}fpext_v8f32_to_v8f64:
; SI: v_cvt_f64_f32_e32
; SI: v_cvt_f64_f32_e32
; SI: v_cvt_f64_f32_e32
; SI: v_cvt_f64_f32_e32
; SI: v_cvt_f64_f32_e32
; SI: v_cvt_f64_f32_e32
; SI: v_cvt_f64_f32_e32
; SI: v_cvt_f64_f32_e32
define amdgpu_kernel void @fpext_v8f32_to_v8f64(<8 x double> addrspace(1)* %out, <8 x float> %in) {
  %result = fpext <8 x float> %in to <8 x double>
  store <8 x double> %result, <8 x double> addrspace(1)* %out
  ret void
}