[x86] fix assert with horizontal math + broadcast of vector (PR43402)
[llvm-core.git] / lib / Support / BranchProbability.cpp
blob195e2d58d8e191f82a67c2c1b110fd73515d8c7d
1 //===-------------- lib/Support/BranchProbability.cpp -----------*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements Branch Probability class.
11 //===----------------------------------------------------------------------===//
13 #include "llvm/Support/BranchProbability.h"
14 #include "llvm/Config/llvm-config.h"
15 #include "llvm/Support/Debug.h"
16 #include "llvm/Support/Format.h"
17 #include "llvm/Support/raw_ostream.h"
18 #include <cassert>
20 using namespace llvm;
22 const uint32_t BranchProbability::D;
24 raw_ostream &BranchProbability::print(raw_ostream &OS) const {
25 if (isUnknown())
26 return OS << "?%";
28 // Get a percentage rounded to two decimal digits. This avoids
29 // implementation-defined rounding inside printf.
30 double Percent = rint(((double)N / D) * 100.0 * 100.0) / 100.0;
31 return OS << format("0x%08" PRIx32 " / 0x%08" PRIx32 " = %.2f%%", N, D,
32 Percent);
35 #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
36 LLVM_DUMP_METHOD void BranchProbability::dump() const { print(dbgs()) << '\n'; }
37 #endif
39 BranchProbability::BranchProbability(uint32_t Numerator, uint32_t Denominator) {
40 assert(Denominator > 0 && "Denominator cannot be 0!");
41 assert(Numerator <= Denominator && "Probability cannot be bigger than 1!");
42 if (Denominator == D)
43 N = Numerator;
44 else {
45 uint64_t Prob64 =
46 (Numerator * static_cast<uint64_t>(D) + Denominator / 2) / Denominator;
47 N = static_cast<uint32_t>(Prob64);
51 BranchProbability
52 BranchProbability::getBranchProbability(uint64_t Numerator,
53 uint64_t Denominator) {
54 assert(Numerator <= Denominator && "Probability cannot be bigger than 1!");
55 // Scale down Denominator to fit in a 32-bit integer.
56 int Scale = 0;
57 while (Denominator > UINT32_MAX) {
58 Denominator >>= 1;
59 Scale++;
61 return BranchProbability(Numerator >> Scale, Denominator);
64 // If ConstD is not zero, then replace D by ConstD so that division and modulo
65 // operations by D can be optimized, in case this function is not inlined by the
66 // compiler.
67 template <uint32_t ConstD>
68 static uint64_t scale(uint64_t Num, uint32_t N, uint32_t D) {
69 if (ConstD > 0)
70 D = ConstD;
72 assert(D && "divide by 0");
74 // Fast path for multiplying by 1.0.
75 if (!Num || D == N)
76 return Num;
78 // Split Num into upper and lower parts to multiply, then recombine.
79 uint64_t ProductHigh = (Num >> 32) * N;
80 uint64_t ProductLow = (Num & UINT32_MAX) * N;
82 // Split into 32-bit digits.
83 uint32_t Upper32 = ProductHigh >> 32;
84 uint32_t Lower32 = ProductLow & UINT32_MAX;
85 uint32_t Mid32Partial = ProductHigh & UINT32_MAX;
86 uint32_t Mid32 = Mid32Partial + (ProductLow >> 32);
88 // Carry.
89 Upper32 += Mid32 < Mid32Partial;
91 uint64_t Rem = (uint64_t(Upper32) << 32) | Mid32;
92 uint64_t UpperQ = Rem / D;
94 // Check for overflow.
95 if (UpperQ > UINT32_MAX)
96 return UINT64_MAX;
98 Rem = ((Rem % D) << 32) | Lower32;
99 uint64_t LowerQ = Rem / D;
100 uint64_t Q = (UpperQ << 32) + LowerQ;
102 // Check for overflow.
103 return Q < LowerQ ? UINT64_MAX : Q;
106 uint64_t BranchProbability::scale(uint64_t Num) const {
107 return ::scale<D>(Num, N, D);
110 uint64_t BranchProbability::scaleByInverse(uint64_t Num) const {
111 return ::scale<0>(Num, D, N);