llvm-project/llvm/lib/Support/BlockFrequency.cpp

//====--------------- lib/Support/BlockFrequency.cpp -----------*- C++ -*-====//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file implements Block Frequency class.
//
//===----------------------------------------------------------------------===//

#include "llvm/Support/BranchProbability.h"
#include "llvm/Support/BlockFrequency.h"
#include "llvm/Support/raw_ostream.h"
#include <cassert>

using namespace llvm;

/// Compute the 96-bit product of a 64-bit value and a 32-bit factor.
///
/// \param freq 64-bit multiplicand.
/// \param N    32-bit multiplier.
/// \param W    Receives the product: W[0] holds the low 64 bits, W[1] holds
///             the bits above them (at most 32 significant bits).
static void mult96bit(uint64_t freq, uint32_t N, uint64_t W[2]) {
  // Split the multiplicand into 32-bit halves so that each partial product
  // fits in a 64-bit integer.
  const uint64_t LoHalf = freq & UINT32_MAX;
  const uint64_t HiHalf = freq >> 32;

  const uint64_t LoProduct = LoHalf * N;

  // Fold the carry out of the low partial product into the high one. This
  // cannot wrap: (2^32-1)^2 + (2^32-1) is still below 2^64.
  const uint64_t HiProduct = HiHalf * N + (LoProduct >> 32);

  // Bits 0-31 come from the low partial product, bits 32-63 from the low half
  // of the high partial product, and bits 64-95 from its high half.
  W[0] = (LoProduct & UINT32_MAX) | (HiProduct << 32);
  W[1] = HiProduct >> 32;
}


/// Divide 96-bit value stored in W array by D.
///
/// \param W Dividend: W[0] holds the low 64 bits and W[1] the bits above them.
///          W[1] is expected to be non-zero; a dividend that fits in 64 bits
///          should use ordinary 64-bit division instead.
/// \param D 32-bit divisor.
/// \returns The 64-bit quotient, saturated to UINT64_MAX on overflow.
static uint64_t div96bit(uint64_t W[2], uint32_t D) {
  uint64_t y = W[0];
  uint64_t x = W[1];

  assert(x != 0 && "This is really a 64-bit division");

  // The quotient needs more than 64 bits exactly when the high word is at
  // least as large as the divisor, so saturate explicitly. This also covers
  // D == 0 and keeps the invariant x < D for the loop below.
  if (x >= D)
    return UINT64_MAX;

  // Restoring long division, one dividend bit per iteration. x is the running
  // remainder; y simultaneously holds the not-yet-consumed dividend bits (high
  // end) and the quotient bits produced so far (low end). All 64 iterations
  // must run: stopping early when the remainder happens to reach zero would
  // drop the dividend bits that are still waiting in y.
  for (unsigned i = 0; i != 64; ++i) {
    // x < D < 2^32 on entry, so the shifted value fits comfortably in 64 bits.
    x = (x << 1) | (y >> 63);
    y <<= 1;
    if (x >= D) {
      x -= D;
      ++y;
    }
  }

  return y;
}


/// Replace Frequency with Frequency * N / D.
///
/// The intermediate product is evaluated in 64 bits when it fits and through
/// the 96-bit helpers otherwise. D must be non-zero.
void BlockFrequency::scale(uint32_t N, uint32_t D) {
  assert(D != 0 && "Division by zero");

  // Form Frequency * N from two 32x32-bit partial products.
  const uint64_t LowPart = (Frequency & UINT32_MAX) * N;
  const uint64_t HighPart = (Frequency >> 32) * N;
  const uint64_t Product = (HighPart << 32) + LowPart;

  // The product exceeds 64 bits if the high partial product does not survive
  // the shift by 32, or if adding the low partial product wrapped around.
  const bool Overflowed = HighPart > UINT32_MAX || Product < LowPart;
  if (Overflowed) {
    // Redo the computation with 96-bit operations; the value is represented
    // as W[1]:W[0].
    uint64_t W[2];
    mult96bit(Frequency, N, W);
    Frequency = div96bit(W, D);
    return;
  }

  // Everything fits in 64 bits, so built-in division is enough.
  Frequency = Product / D;
}

/// Multiply this frequency in place by the probability \p Prob, i.e. scale it
/// by numerator / denominator, and return a reference to this object.
BlockFrequency &BlockFrequency::operator*=(const BranchProbability &Prob) {
  const uint32_t Numerator = Prob.getNumerator();
  const uint32_t Denominator = Prob.getDenominator();
  scale(Numerator, Denominator);
  return *this;
}

/// Return a copy of this frequency multiplied by \p Prob; this object is left
/// unchanged.
const BlockFrequency
BlockFrequency::operator*(const BranchProbability &Prob) const {
  BlockFrequency Scaled(Frequency);
  // Delegate the arithmetic to the compound-assignment form.
  Scaled *= Prob;
  return Scaled;
}

/// Divide this frequency in place by the probability \p Prob, i.e. scale it
/// by denominator / numerator, and return a reference to this object.
///
/// The numerator of \p Prob becomes the divisor passed to scale(), which
/// asserts that it is non-zero.
BlockFrequency &BlockFrequency::operator/=(const BranchProbability &Prob) {
  const uint32_t Multiplier = Prob.getDenominator();
  const uint32_t Divisor = Prob.getNumerator();
  scale(Multiplier, Divisor);
  return *this;
}

/// Return a copy of this frequency divided by \p Prob; this object is left
/// unchanged.
BlockFrequency BlockFrequency::operator/(const BranchProbability &Prob) const {
  BlockFrequency Quotient(Frequency);
  // Delegate the arithmetic to the compound-assignment form.
  Quotient /= Prob;
  return Quotient;
}

/// Add \p Freq to this frequency in place, clamping the result to UINT64_MAX
/// if the 64-bit sum wraps around. Returns a reference to this object.
BlockFrequency &BlockFrequency::operator+=(const BlockFrequency &Freq) {
  // Take the addend by value first so the check below stays valid even when
  // Freq refers to this very object.
  const uint64_t Addend = Freq.Frequency;
  Frequency += Addend;

  // An unsigned sum that ends up smaller than one of its operands has wrapped.
  if (Frequency < Addend)
    Frequency = UINT64_MAX;

  return *this;
}

/// Return the saturating sum of this frequency and \p Prob; this object is
/// left unchanged.
const BlockFrequency
BlockFrequency::operator+(const BlockFrequency &Prob) const {
  BlockFrequency Sum(Frequency);
  // Delegate the saturating arithmetic to the compound-assignment form.
  Sum += Prob;
  return Sum;
}

/// Write this frequency to \p OS as a decimal number, treating Frequency as a
/// fixed-point value whose unit is getEntryFrequency().
void BlockFrequency::print(raw_ostream &OS) const {
  // Integer part, followed by the decimal point.
  OS << Frequency / getEntryFrequency() << ".";

  // Fractional part: produce one decimal digit per iteration. At least one
  // digit is always printed; generation stops once the leftover remainder
  // drops below half of 10^(digits printed so far).
  uint64_t Remainder = Frequency % getEntryFrequency();
  uint64_t Threshold = 1;
  for (;;) {
    Remainder *= 10;
    Threshold *= 10;
    OS << Remainder / getEntryFrequency();
    Remainder %= getEntryFrequency();
    if (Remainder < Threshold / 2)
      break;
  }
}

namespace llvm {

/// Stream insertion for BlockFrequency: forwards to BlockFrequency::print and
/// returns the stream so that insertions can be chained.
raw_ostream &operator<<(raw_ostream &OS, const BlockFrequency &Freq) {
  Freq.print(OS);
  return OS;
}

} // end namespace llvm
Add BlockFrequency class. llvm-svn: 135992 2011-07-26 06:24:51 +08:00			`//====--------------- lib/Support/BlockFrequency.cpp ------------ C++ --====//`
			`//`
			`// The LLVM Compiler Infrastructure`
			`//`
			`// This file is distributed under the University of Illinois Open Source`
			`// License. See LICENSE.TXT for details.`
			`//`
			`//===----------------------------------------------------------------------===//`
			`//`
			`// This file implements Block Frequency class.`
			`//`
			`//===----------------------------------------------------------------------===//`

			`#include "llvm/Support/BranchProbability.h"`
			`#include "llvm/Support/BlockFrequency.h"`
			`#include "llvm/Support/raw_ostream.h"`
			`#include <cassert>`

			`using namespace llvm;`

Stylistic cleanups, no functional change. - Use static functions instead of anonymous namespace. - Appease the Doxygen lobby. - Use 0-based induction variable. llvm-svn: 185185 2013-06-29 02:33:19 +08:00			`/// Multiply FREQ by N and store result in W array.`
			`static void mult96bit(uint64_t freq, uint32_t N, uint64_t W[2]) {`
Add BlockFrequency class. llvm-svn: 135992 2011-07-26 06:24:51 +08:00			`uint64_t u0 = freq & UINT32_MAX;`
			`uint64_t u1 = freq >> 32;`

			`// Represent 96-bit value as w[2]:w[1]:w[0];`
			`uint32_t w[3] = { 0, 0, 0 };`

			`uint64_t t = u0 * N;`
			`uint64_t k = t >> 32;`
			`w[0] = t;`
			`t = u1 * N + k;`
			`w[1] = t;`
			`w[2] = t >> 32;`

			`// W[1] - higher bits.`
			`// W[0] - lower bits.`
			`W[0] = w[0] + ((uint64_t) w[1] << 32);`
			`W[1] = w[2];`
			`}`


Stylistic cleanups, no functional change. - Use static functions instead of anonymous namespace. - Appease the Doxygen lobby. - Use 0-based induction variable. llvm-svn: 185185 2013-06-29 02:33:19 +08:00			`/// Divide 96-bit value stored in W array by D.`
Add a division operator to BlockFrequency. Allow a BlockFrequency to be divided by a non-zero BranchProbability with saturating arithmetic. This will be used to compute the frequency of a loop header given the probability of leaving the loop. Our long division algorithm already saturates on overflow, so that was a freebie. llvm-svn: 185184 2013-06-29 02:23:42 +08:00			`/// Return 64-bit quotient, saturated to UINT64_MAX on overflow.`
Stylistic cleanups, no functional change. - Use static functions instead of anonymous namespace. - Appease the Doxygen lobby. - Use 0-based induction variable. llvm-svn: 185185 2013-06-29 02:33:19 +08:00			`static uint64_t div96bit(uint64_t W[2], uint32_t D) {`
Add BlockFrequency class. llvm-svn: 135992 2011-07-26 06:24:51 +08:00			`uint64_t y = W[0];`
			`uint64_t x = W[1];`
Stylistic cleanups, no functional change. - Use static functions instead of anonymous namespace. - Appease the Doxygen lobby. - Use 0-based induction variable. llvm-svn: 185185 2013-06-29 02:33:19 +08:00			`unsigned i;`
Add BlockFrequency class. llvm-svn: 135992 2011-07-26 06:24:51 +08:00
Fix a bad overflow check pointed out by Ben. llvm-svn: 185226 2013-06-29 05:51:18 +08:00			`assert(x != 0 && "This is really a 64-bit division");`
Eliminate an assortment of undefined behavior. Hopefully, this fixes the PPC64 buildbots. llvm-svn: 185218 2013-06-29 05:10:25 +08:00
Add a division operator to BlockFrequency. Allow a BlockFrequency to be divided by a non-zero BranchProbability with saturating arithmetic. This will be used to compute the frequency of a loop header given the probability of leaving the loop. Our long division algorithm already saturates on overflow, so that was a freebie. llvm-svn: 185184 2013-06-29 02:23:42 +08:00			`// This long division algorithm automatically saturates on overflow.`
Stylistic cleanups, no functional change. - Use static functions instead of anonymous namespace. - Appease the Doxygen lobby. - Use 0-based induction variable. llvm-svn: 185185 2013-06-29 02:33:19 +08:00			`for (i = 0; i < 64 && x; ++i) {`
Eliminate an assortment of undefined behavior. Hopefully, this fixes the PPC64 buildbots. llvm-svn: 185218 2013-06-29 05:10:25 +08:00			`uint32_t t = -((x >> 31) & 1); // Splat bit 31 to bits 0-31.`
Add BlockFrequency class. llvm-svn: 135992 2011-07-26 06:24:51 +08:00			`x = (x << 1) \| (y >> 63);`
			`y = y << 1;`
			`if ((x \| t) >= D) {`
			`x -= D;`
			`++y;`
			`}`
			`}`

Stylistic cleanups, no functional change. - Use static functions instead of anonymous namespace. - Appease the Doxygen lobby. - Use 0-based induction variable. llvm-svn: 185185 2013-06-29 02:33:19 +08:00			`return y << (64 - i);`
Add BlockFrequency class. llvm-svn: 135992 2011-07-26 06:24:51 +08:00			`}`

Move static methods to the anonymous namespace. llvm-svn: 136221 2011-07-27 23:51:51 +08:00
Add a division operator to BlockFrequency. Allow a BlockFrequency to be divided by a non-zero BranchProbability with saturating arithmetic. This will be used to compute the frequency of a loop header given the probability of leaving the loop. Our long division algorithm already saturates on overflow, so that was a freebie. llvm-svn: 185184 2013-06-29 02:23:42 +08:00			`void BlockFrequency::scale(uint32_t N, uint32_t D) {`
			`assert(D != 0 && "Division by zero");`
Move static methods to the anonymous namespace. llvm-svn: 136221 2011-07-27 23:51:51 +08:00
Add a division operator to BlockFrequency. Allow a BlockFrequency to be divided by a non-zero BranchProbability with saturating arithmetic. This will be used to compute the frequency of a loop header given the probability of leaving the loop. Our long division algorithm already saturates on overflow, so that was a freebie. llvm-svn: 185184 2013-06-29 02:23:42 +08:00			`// Calculate Frequency * N.`
			`uint64_t MulLo = (Frequency & UINT32_MAX) * N;`
			`uint64_t MulHi = (Frequency >> 32) * N;`
			`uint64_t MulRes = (MulHi << 32) + MulLo;`

			`// If the product fits in 64 bits, just use built-in division.`
Fix a bad overflow check pointed out by Ben. llvm-svn: 185226 2013-06-29 05:51:18 +08:00			`if (MulHi <= UINT32_MAX && MulRes >= MulLo) {`
Add a division operator to BlockFrequency. Allow a BlockFrequency to be divided by a non-zero BranchProbability with saturating arithmetic. This will be used to compute the frequency of a loop header given the probability of leaving the loop. Our long division algorithm already saturates on overflow, so that was a freebie. llvm-svn: 185184 2013-06-29 02:23:42 +08:00			`Frequency = MulRes / D;`
			`return;`
Add BlockFrequency class. llvm-svn: 135992 2011-07-26 06:24:51 +08:00			`}`

Add a division operator to BlockFrequency. Allow a BlockFrequency to be divided by a non-zero BranchProbability with saturating arithmetic. This will be used to compute the frequency of a loop header given the probability of leaving the loop. Our long division algorithm already saturates on overflow, so that was a freebie. llvm-svn: 185184 2013-06-29 02:23:42 +08:00			`// Product overflowed, use 96-bit operations.`
			`// 96-bit value represented as W[1]:W[0].`
			`uint64_t W[2];`
			`mult96bit(Frequency, N, W);`
			`Frequency = div96bit(W, D);`
			`return;`
			`}`

			`BlockFrequency &BlockFrequency::operator*=(const BranchProbability &Prob) {`
			`scale(Prob.getNumerator(), Prob.getDenominator());`
Add BlockFrequency class. llvm-svn: 135992 2011-07-26 06:24:51 +08:00			`return *this;`
			`}`

			`const BlockFrequency`
			`BlockFrequency::operator*(const BranchProbability &Prob) const {`
			`BlockFrequency Freq(Frequency);`
			`Freq *= Prob;`
			`return Freq;`
			`}`

Add a division operator to BlockFrequency. Allow a BlockFrequency to be divided by a non-zero BranchProbability with saturating arithmetic. This will be used to compute the frequency of a loop header given the probability of leaving the loop. Our long division algorithm already saturates on overflow, so that was a freebie. llvm-svn: 185184 2013-06-29 02:23:42 +08:00			`BlockFrequency &BlockFrequency::operator/=(const BranchProbability &Prob) {`
			`scale(Prob.getDenominator(), Prob.getNumerator());`
			`return *this;`
			`}`

			`BlockFrequency BlockFrequency::operator/(const BranchProbability &Prob) const {`
			`BlockFrequency Freq(Frequency);`
			`Freq /= Prob;`
			`return Freq;`
			`}`

Add BlockFrequency class. llvm-svn: 135992 2011-07-26 06:24:51 +08:00			`BlockFrequency &BlockFrequency::operator+=(const BlockFrequency &Freq) {`
			`uint64_t Before = Freq.Frequency;`
			`Frequency += Freq.Frequency;`

			`// If overflow, set frequency to the maximum value.`
			`if (Frequency < Before)`
			`Frequency = UINT64_MAX;`

			`return *this;`
			`}`

			`const BlockFrequency`
			`BlockFrequency::operator+(const BlockFrequency &Prob) const {`
			`BlockFrequency Freq(Frequency);`
			`Freq += Prob;`
			`return Freq;`
			`}`

			`void BlockFrequency::print(raw_ostream &OS) const {`
Print block frequencies in decimal form. This is easier to read than the internal fixed-point representation. If anybody knows the correct algorithm for converting fixed-point numbers to base 10, feel free to fix it. llvm-svn: 184881 2013-06-26 05:57:38 +08:00			`// Convert fixed-point number to decimal.`
			`OS << Frequency / getEntryFrequency() << ".";`
			`uint64_t Rem = Frequency % getEntryFrequency();`
			`uint64_t Eps = 1;`
			`do {`
			`Rem *= 10;`
			`Eps *= 10;`
			`OS << Rem / getEntryFrequency();`
			`Rem = Rem % getEntryFrequency();`
			`} while (Rem >= Eps/2);`
Add BlockFrequency class. llvm-svn: 135992 2011-07-26 06:24:51 +08:00			`}`

			`namespace llvm {`

			`raw_ostream &operator<<(raw_ostream &OS, const BlockFrequency &Freq) {`
			`Freq.print(OS);`
			`return OS;`
			`}`

			`}`