1 ; RUN: llc -mtriple=amdgcn--amdhsa -verify-machineinstrs < %s | FileCheck -check-prefix=GCN %s
; Default-mode case using attribute group #0 ("target-cpu"="kaveri").
; The directives below expect .amdhsa_dx10_clamp and .amdhsa_ieee_mode to both
; be emitted as 1. The kernel body only stores a float zero and a double zero
; through its two addrspace(1) pointer arguments.
3 ; GCN-LABEL: {{^}}test_default_ci:
4 ; GCN: .amdhsa_dx10_clamp 1
5 ; GCN: .amdhsa_ieee_mode 1
7 define amdgpu_kernel void @test_default_ci(ptr addrspace(1) %out0, ptr addrspace(1) %out1) #0 {
8 store float 0.0, ptr addrspace(1) %out0
9 store double 0.0, ptr addrspace(1) %out1
; Default-mode case using attribute group #1 ("target-cpu"="fiji").
; Same expectations as the kaveri variant: .amdhsa_dx10_clamp and
; .amdhsa_ieee_mode are both expected to be 1.
13 ; GCN-LABEL: {{^}}test_default_vi:
14 ; GCN: .amdhsa_dx10_clamp 1
15 ; GCN: .amdhsa_ieee_mode 1
17 define amdgpu_kernel void @test_default_vi(ptr addrspace(1) %out0, ptr addrspace(1) %out1) #1 {
18 store float 0.0, ptr addrspace(1) %out0
19 store double 0.0, ptr addrspace(1) %out1
; Uses attribute group #2, which sets only
; "denormal-fp-math-f32"="preserve-sign,preserve-sign".
; The directives below expect .amdhsa_dx10_clamp 1 and .amdhsa_ieee_mode 1,
; i.e. the same values as the default cases.
; NOTE(review): no denormal-mode directive is matched in the lines visible
; here, so the denormal setting itself is not verified by these checks.
23 ; GCN-LABEL: {{^}}test_f64_denormals:
24 ; GCN: .amdhsa_dx10_clamp 1
25 ; GCN: .amdhsa_ieee_mode 1
27 define amdgpu_kernel void @test_f64_denormals(ptr addrspace(1) %out0, ptr addrspace(1) %out1) #2 {
28 store float 0.0, ptr addrspace(1) %out0
29 store double 0.0, ptr addrspace(1) %out1
; Uses attribute group #3, which sets "denormal-fp-math-f32"="ieee,ieee"
; together with "denormal-fp-math"="preserve-sign,preserve-sign".
; The directives below expect .amdhsa_dx10_clamp 1 and .amdhsa_ieee_mode 1.
; NOTE(review): no denormal-mode directive is matched in the lines visible
; here, so the denormal setting itself is not verified by these checks.
33 ; GCN-LABEL: {{^}}test_f32_denormals:
34 ; GCN: .amdhsa_dx10_clamp 1
35 ; GCN: .amdhsa_ieee_mode 1
37 define amdgpu_kernel void @test_f32_denormals(ptr addrspace(1) %out0, ptr addrspace(1) %out1) #3 {
38 store float 0.0, ptr addrspace(1) %out0
39 store double 0.0, ptr addrspace(1) %out1
; Uses attribute group #4, which sets "denormal-fp-math"="ieee,ieee".
; The directives below expect .amdhsa_dx10_clamp 1 and .amdhsa_ieee_mode 1.
; NOTE(review): no denormal-mode directive is matched in the lines visible
; here, so the denormal setting itself is not verified by these checks.
43 ; GCN-LABEL: {{^}}test_f32_f64_denormals:
44 ; GCN: .amdhsa_dx10_clamp 1
45 ; GCN: .amdhsa_ieee_mode 1
47 define amdgpu_kernel void @test_f32_f64_denormals(ptr addrspace(1) %out0, ptr addrspace(1) %out1) #4 {
48 store float 0.0, ptr addrspace(1) %out0
49 store double 0.0, ptr addrspace(1) %out1
; Uses attribute group #5, which sets
; "denormal-fp-math"="preserve-sign,preserve-sign".
; The directives below expect .amdhsa_dx10_clamp 1 and .amdhsa_ieee_mode 1.
; NOTE(review): no denormal-mode directive is matched in the lines visible
; here, so the denormal setting itself is not verified by these checks.
53 ; GCN-LABEL: {{^}}test_no_denormals:
54 ; GCN: .amdhsa_dx10_clamp 1
55 ; GCN: .amdhsa_ieee_mode 1
57 define amdgpu_kernel void @test_no_denormals(ptr addrspace(1) %out0, ptr addrspace(1) %out1) #5 {
58 store float 0.0, ptr addrspace(1) %out0
59 store double 0.0, ptr addrspace(1) %out1
; Uses attribute group #6 ("amdgpu-dx10-clamp"="false", "target-cpu"="fiji").
; The directives below expect .amdhsa_dx10_clamp to drop to 0 while
; .amdhsa_ieee_mode stays at 1.
63 ; GCN-LABEL: {{^}}test_no_dx10_clamp_vi:
64 ; GCN: .amdhsa_dx10_clamp 0
65 ; GCN: .amdhsa_ieee_mode 1
67 define amdgpu_kernel void @test_no_dx10_clamp_vi(ptr addrspace(1) %out0, ptr addrspace(1) %out1) #6 {
68 store float 0.0, ptr addrspace(1) %out0
69 store double 0.0, ptr addrspace(1) %out1
; Uses attribute group #7 ("amdgpu-ieee"="false", "target-cpu"="fiji").
; The directives below expect .amdhsa_ieee_mode to drop to 0 while
; .amdhsa_dx10_clamp stays at 1.
73 ; GCN-LABEL: {{^}}test_no_ieee_mode_vi:
74 ; GCN: .amdhsa_dx10_clamp 1
75 ; GCN: .amdhsa_ieee_mode 0
77 define amdgpu_kernel void @test_no_ieee_mode_vi(ptr addrspace(1) %out0, ptr addrspace(1) %out1) #7 {
78 store float 0.0, ptr addrspace(1) %out0
79 store double 0.0, ptr addrspace(1) %out1
; Uses attribute group #8, which disables both "amdgpu-dx10-clamp" and
; "amdgpu-ieee" on "target-cpu"="fiji".
; The directives below expect .amdhsa_dx10_clamp and .amdhsa_ieee_mode to both
; be emitted as 0.
83 ; GCN-LABEL: {{^}}test_no_ieee_mode_no_dx10_clamp_vi:
84 ; GCN: .amdhsa_dx10_clamp 0
85 ; GCN: .amdhsa_ieee_mode 0
87 define amdgpu_kernel void @test_no_ieee_mode_no_dx10_clamp_vi(ptr addrspace(1) %out0, ptr addrspace(1) %out1) #8 {
88 store float 0.0, ptr addrspace(1) %out0
89 store double 0.0, ptr addrspace(1) %out1
; Function attribute groups, one per kernel in this file (kernel N uses #N in
; definition order). Every group is nounwind.
;   #0, #1 : only select a target CPU (kaveri / fiji); used by the default cases.
;   #2..#5 : vary the "denormal-fp-math" / "denormal-fp-math-f32" settings and
;            do not name a target CPU.
;   #6..#8 : disable "amdgpu-dx10-clamp", "amdgpu-ieee", or both, on fiji.
93 attributes #0 = { nounwind "target-cpu"="kaveri" }
94 attributes #1 = { nounwind "target-cpu"="fiji" }
95 attributes #2 = { nounwind "denormal-fp-math-f32"="preserve-sign,preserve-sign" }
96 attributes #3 = { nounwind "denormal-fp-math-f32"="ieee,ieee" "denormal-fp-math"="preserve-sign,preserve-sign" }
97 attributes #4 = { nounwind "denormal-fp-math"="ieee,ieee" }
98 attributes #5 = { nounwind "denormal-fp-math"="preserve-sign,preserve-sign" }
99 attributes #6 = { nounwind "amdgpu-dx10-clamp"="false" "target-cpu"="fiji" }
100 attributes #7 = { nounwind "amdgpu-ieee"="false" "target-cpu"="fiji" }
101 attributes #8 = { nounwind "amdgpu-dx10-clamp"="false" "amdgpu-ieee"="false" "target-cpu"="fiji" }
; Module-level flag: sets "amdgpu_code_object_version" to 400 for the whole
; module. NOTE(review): 400 presumably selects AMDHSA code object v4, which
; would be why the checks above match .amdhsa_* directives -- confirm against
; the AMDGPU usage guide.
103 !llvm.module.flags = !{!0}
104 !0 = !{i32 1, !"amdgpu_code_object_version", i32 400}