1 //===-- x86_64 implementations of the fma function --------------*- C++ -*-===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 #ifndef LLVM_LIBC_SRC_SUPPORT_FPUTIL_X86_64_FMA_H
10 #define LLVM_LIBC_SRC_SUPPORT_FPUTIL_X86_64_FMA_H
12 #include "src/__support/macros/attributes.h" // LIBC_INLINE
13 #include "src/__support/macros/properties/architectures.h"
14 #include "src/__support/macros/properties/cpu_features.h" // LIBC_TARGET_CPU_HAS_FMA
16 #if !defined(LIBC_TARGET_ARCH_IS_X86_64)
17 #error "Invalid include"
20 #if !defined(LIBC_TARGET_CPU_HAS_FMA)
21 #error "FMA instructions are not supported"
24 #include "src/__support/CPP/type_traits.h"
25 #include <immintrin.h>
27 namespace __llvm_libc
{
31 LIBC_INLINE
cpp::enable_if_t
<cpp::is_same_v
<T
, float>, T
> fma(T x
, T y
, T z
) {
33 __m128 xmm
= _mm_load_ss(&x
); // NOLINT
34 __m128 ymm
= _mm_load_ss(&y
); // NOLINT
35 __m128 zmm
= _mm_load_ss(&z
); // NOLINT
36 __m128 r
= _mm_fmadd_ss(xmm
, ymm
, zmm
); // NOLINT
37 _mm_store_ss(&result
, r
); // NOLINT
42 LIBC_INLINE
cpp::enable_if_t
<cpp::is_same_v
<T
, double>, T
> fma(T x
, T y
, T z
) {
44 __m128d xmm
= _mm_load_sd(&x
); // NOLINT
45 __m128d ymm
= _mm_load_sd(&y
); // NOLINT
46 __m128d zmm
= _mm_load_sd(&z
); // NOLINT
47 __m128d r
= _mm_fmadd_sd(xmm
, ymm
, zmm
); // NOLINT
48 _mm_store_sd(&result
, r
); // NOLINT
53 } // namespace __llvm_libc
55 #endif // LLVM_LIBC_SRC_SUPPORT_FPUTIL_X86_64_FMA_H