Google OR-Tools v9.11
a fast and portable software suite for combinatorial optimization
Loading...
Searching...
No Matches
saturated_arithmetic.h
Go to the documentation of this file.
1// Copyright 2010-2024 Google LLC
2// Licensed under the Apache License, Version 2.0 (the "License");
3// you may not use this file except in compliance with the License.
4// You may obtain a copy of the License at
5//
6// http://www.apache.org/licenses/LICENSE-2.0
7//
8// Unless required by applicable law or agreed to in writing, software
9// distributed under the License is distributed on an "AS IS" BASIS,
10// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
11// See the License for the specific language governing permissions and
12// limitations under the License.
13
14#ifndef OR_TOOLS_UTIL_SATURATED_ARITHMETIC_H_
15#define OR_TOOLS_UTIL_SATURATED_ARITHMETIC_H_
16
17#include <cstdint>
18#include <limits>
19#include <type_traits>
20
21#include "absl/base/casts.h"
22#include "absl/log/check.h"
23#include "ortools/base/types.h"
24#include "ortools/util/bitset.h"
25
26// This file contains implementations for saturated addition, subtraction and
27// multiplication.
28// Currently, there are three versions of the code.
29// The code using the built-ins provided since GCC 5.0 now compiles really well
30// with clang/LLVM on both x86_64 and ARM. It should therefore be the standard,
31// but not for multiplication, see below.
32//
33// For example, on ARM, only 4 instructions are needed, two of which are
34// additions that can be executed in parallel.
35//
// On x86_64, we're keeping the code with inline assembly for GCC as GCC does
// not manage to compile the code with built-ins properly.
38// On x86_64, the product of two 64-bit registers is a 128-bit integer
39// stored in two 64-bit registers. It's the carry flag that is set when the
40// result exceeds 64 bits, not the overflow flag. Since the built-in uses the
41// overflow flag, we have to resort on the assembly-based version of the code.
42//
43// Sadly, MSVC does not support the built-ins nor does it support inline
44// assembly. We have to rely on the generic, C++ only version of the code which
45// is much slower.
46//
47// TODO(user): make this implementation the default everywhere.
48// TODO(user): investigate the code generated by MSVC.
49
50namespace operations_research {
51
52// Checks if x is equal to the min or the max value of an int64_t.
// Returns true when x is exactly kint64min or kint64max, the two sentinel
// values that the Cap* functions treat as +/- infinity.
inline bool AtMinOrMaxInt64(int64_t x) {
  constexpr int64_t kMin = std::numeric_limits<int64_t>::min();
  constexpr int64_t kMax = std::numeric_limits<int64_t>::max();
  return x == kMin || x == kMax;
}
57
58// Note(user): -kint64min != kint64max, but kint64max == ~kint64min.
59inline int64_t CapOpp(int64_t v) { return v == kint64min ? ~v : -v; }
60
// Saturated absolute value: |kint64min| does not fit in an int64_t, so it is
// capped to kint64max.
inline int64_t CapAbs(int64_t v) {
  if (v == std::numeric_limits<int64_t>::min()) {
    return std::numeric_limits<int64_t>::max();
  }
  return v < 0 ? -v : v;
}
65
66// ---------- Overflow utility functions ----------
67
68// Implement two's complement addition and subtraction on int64s.
69//
70// The C and C++ standards specify that the overflow of signed integers is
71// undefined. This is because of the different possible representations that may
72// be used for signed integers (one's complement, two's complement, sign and
73// magnitude). Such overflows are detected by Address Sanitizer with
74// -fsanitize=signed-integer-overflow.
75//
76// Simple, portable overflow detection on current machines relies on
77// these two functions. For example, if the sign of the sum of two positive
78// integers is negative, there has been an overflow.
79//
80// Note that the static assert will break if the code is compiled on machines
81// which do not use two's complement.
82inline int64_t TwosComplementAddition(int64_t x, int64_t y) {
83 static_assert(static_cast<uint64_t>(-1LL) == ~0ULL,
84 "The target architecture does not use two's complement.");
85 return absl::bit_cast<int64_t>(static_cast<uint64_t>(x) +
86 static_cast<uint64_t>(y));
87}
88
89inline int64_t TwosComplementSubtraction(int64_t x, int64_t y) {
90 static_assert(static_cast<uint64_t>(-1LL) == ~0ULL,
91 "The target architecture does not use two's complement.");
92 return absl::bit_cast<int64_t>(static_cast<uint64_t>(x) -
93 static_cast<uint64_t>(y));
94}
95
96// Helper function that returns true if an overflow has occurred in computing
97// sum = x + y. sum is expected to be computed elsewhere.
98inline bool AddHadOverflow(int64_t x, int64_t y, int64_t sum) {
99 // Overflow cannot occur if operands have different signs.
100 // It can only occur if sign(x) == sign(y) and sign(sum) != sign(x),
101 // which is equivalent to: sign(x) != sign(sum) && sign(y) != sign(sum).
102 // This is captured when the expression below is negative.
103 DCHECK_EQ(sum, TwosComplementAddition(x, y));
104 return ((x ^ sum) & (y ^ sum)) < 0;
105}
106
107inline bool SubHadOverflow(int64_t x, int64_t y, int64_t diff) {
108 // This is the same reasoning as for AddHadOverflow. We have x = diff + y.
109 // The formula is the same, with 'x' and diff exchanged.
110 DCHECK_EQ(diff, TwosComplementSubtraction(x, y));
111 return AddHadOverflow(diff, y, x);
112}
113
114// A note on overflow treatment.
115// kint64min and kint64max are treated as infinity.
116// Thus if the computation overflows, the result is always kint64m(ax/in).
117//
118// Note(user): this is actually wrong: when computing A-B, if A is kint64max
119// and B is finite, then A-B won't be kint64max: overflows aren't sticky.
120// TODO(user): consider making some operations overflow-sticky, some others
121// not, but make an explicit choice throughout.
122inline bool AddOverflows(int64_t x, int64_t y) {
124}
125
126inline int64_t SubOverflows(int64_t x, int64_t y) {
128}
129
130// Performs *b += a and returns false iff the addition overflow or underflow.
131// This function only works for typed integer type (IntType<>).
132template <typename IntegerType>
133bool SafeAddInto(IntegerType a, IntegerType* b) {
134 const int64_t x = a.value();
135 const int64_t y = b->value();
136 const int64_t sum = TwosComplementAddition(x, y);
137 if (AddHadOverflow(x, y, sum)) return false;
138 *b = sum;
139 return true;
140}
141
142// Returns kint64max if x >= 0 and kint64min if x < 0.
143inline int64_t CapWithSignOf(int64_t x) {
144 // return kint64max if x >= 0 or kint64max + 1 (== kint64min) if x < 0.
145 return TwosComplementAddition(kint64max, static_cast<int64_t>(x < 0));
146}
147
// The following implementations are here for GCC because it does not
// compile the built-ins correctly. The code is either too long without
// branches or contains jumps. These implementations are probably optimal
// on x86_64.
152#if defined(__GNUC__) && !defined(__clang_) && defined(__x86_64__)
153inline int64_t CapAddAsm(int64_t x, int64_t y) {
154 const int64_t cap = CapWithSignOf(x);
155 int64_t result = x;
156 // clang-format off
157 asm volatile( // 'volatile': ask compiler optimizer "keep as is".
158 "\t" "addq %[y],%[result]"
159 "\n\t" "cmovoq %[cap],%[result]" // Conditional move if overflow.
160 : [result] "=r"(result) // Output
161 : "[result]" (result), [y] "r"(y), [cap] "r"(cap) // Input.
162 : "cc" /* Clobbered registers */ );
163 // clang-format on
164 return result;
165}
166
167inline int64_t CapSubAsm(int64_t x, int64_t y) {
168 const int64_t cap = CapWithSignOf(x);
169 int64_t result = x;
170 // clang-format off
171 asm volatile( // 'volatile': ask compiler optimizer "keep as is".
172 "\t" "subq %[y],%[result]"
173 "\n\t" "cmovoq %[cap],%[result]" // Conditional move if overflow.
174 : [result] "=r"(result) // Output
175 : "[result]" (result), [y] "r"(y), [cap] "r"(cap) // Input.
176 : "cc" /* Clobbered registers */ );
177 // clang-format on
178 return result;
179}
180
181// Note that on x86_64, we have to use this code because it's the carry flag
182// that is set when the product of two 64-bit integers does not fit in 64-bit.
183inline int64_t CapProdAsm(int64_t x, int64_t y) {
184 // cap = kint64max if x and y have the same sign, cap = kint64min
185 // otherwise.
186 const int64_t cap = CapWithSignOf(x ^ y);
187 int64_t result = x;
188 // Here, we use the fact that imul of two signed 64-integers returns a 128-bit
189 // result -- we care about the lower 64 bits. More importantly, imul also sets
190 // the carry flag if 64 bits were not enough.
191 // We therefore use cmovc to return cap if the carry was set.
192 // clang-format off
193 asm volatile( // 'volatile': ask compiler optimizer "keep as is".
194 "\n\t" "imulq %[y],%[result]"
195 "\n\t" "cmovcq %[cap],%[result]" // Conditional move if carry.
196 : [result] "=r"(result) // Output
197 : "[result]" (result), [y] "r"(y), [cap] "r"(cap) // Input.
198 : "cc" /* Clobbered registers */);
199 // clang-format on
200 return result;
201}
202#endif
203
204// Simple implementations which use the built-ins provided by both GCC and
205// clang. clang compiles to very good code for both x86_64 and ARM. This is the
206// preferred implementation in general.
207#if defined(__clang__)
208inline int64_t CapAddBuiltIn(int64_t x, int64_t y) {
209 const int64_t cap = CapWithSignOf(x);
210 int64_t result;
211 const bool overflowed = __builtin_add_overflow(x, y, &result);
212 return overflowed ? cap : result;
213}
214
215inline int64_t CapSubBuiltIn(int64_t x, int64_t y) {
216 const int64_t cap = CapWithSignOf(x);
217 int64_t result;
218 const bool overflowed = __builtin_sub_overflow(x, y, &result);
219 return overflowed ? cap : result;
220}
221
222// As said above, this is useless on x86_64.
223inline int64_t CapProdBuiltIn(int64_t x, int64_t y) {
224 const int64_t cap = CapWithSignOf(x ^ y);
225 int64_t result;
226 const bool overflowed = __builtin_mul_overflow(x, y, &result);
227 return overflowed ? cap : result;
228}
229#endif
230
231// Generic implementations. They are very good for addition and subtraction,
232// less so for multiplication.
233inline int64_t CapAddGeneric(int64_t x, int64_t y) {
234 const int64_t result = TwosComplementAddition(x, y);
235 return AddHadOverflow(x, y, result) ? CapWithSignOf(x) : result;
236}
237
238inline int64_t CapSubGeneric(int64_t x, int64_t y) {
239 const int64_t result = TwosComplementSubtraction(x, y);
240 return SubHadOverflow(x, y, result) ? CapWithSignOf(x) : result;
241}
242
namespace cap_prod_util {
// Returns an unsigned int equal to the absolute value of n, in a way that
// will not produce overflows (in particular, |kint64min| is representable
// as a uint64_t even though it is not as an int64_t).
inline uint64_t uint_abs(int64_t n) {
  const uint64_t u = static_cast<uint64_t>(n);
  // For negative n, unsigned negation (0 - u) is the two's complement of u,
  // i.e. exactly |n| modulo 2^64.
  return n < 0 ? 0 - u : u;
}
}  // namespace cap_prod_util
250
251// The generic algorithm computes a bound on the number of bits necessary to
252// store the result. For this it uses the position of the most significant bits
253// of each of the arguments.
254// If the result needs at least 64 bits, then return a capped value.
255// If the result needs at most 63 bits, then return the product.
256// Otherwise, the result may use 63 or 64 bits: compute the product
257// as a uint64_t, and cap it if necessary.
258inline int64_t CapProdGeneric(int64_t x, int64_t y) {
259 const uint64_t a = cap_prod_util::uint_abs(x);
260 const uint64_t b = cap_prod_util::uint_abs(y);
261 // Let MSB(x) denote the most significant bit of x. We have:
262 // MSB(x) + MSB(y) <= MSB(x * y) <= MSB(x) + MSB(y) + 1
263 const int msb_sum =
265 const int kMaxBitIndexInInt64 = 63;
266 if (msb_sum <= kMaxBitIndexInInt64 - 2) return x * y;
267 // Catch a == 0 or b == 0 now, as MostSignificantBitPosition64(0) == 0.
268 // TODO(user): avoid this by writing function Log2(a) with Log2(0) == -1.
269 if (a == 0 || b == 0) return 0;
270 const int64_t cap = CapWithSignOf(x ^ y);
271 if (msb_sum >= kMaxBitIndexInInt64) return cap;
272 // The corner case is when msb_sum == 62, i.e. at least 63 bits will be
273 // needed to store the product. The following product will never overflow
274 // on uint64_t, since msb_sum == 62.
275 const uint64_t u_prod = a * b;
276 // The overflow cases are captured by one of the following conditions:
277 // (cap >= 0 && u_prod >= static_cast<uint64_t>(kint64max) or
278 // (cap < 0 && u_prod >= static_cast<uint64_t>(kint64min)).
279 // These can be optimized as follows (and if the condition is false, it is
280 // safe to compute x * y.
281 if (u_prod >= static_cast<uint64_t>(cap)) return cap;
282 const int64_t abs_result = absl::bit_cast<int64_t>(u_prod);
283 return cap < 0 ? -abs_result : abs_result;
284}
285
// A generic, safer version of CapAdd() where we don't silently convert double
// or int32_t to int64_t. When the inputs are floating-point, uses '+', else
// uses CapAdd() for int64_t, and a (slow-ish) int32_t version for int.
// Forward declaration only; the definition appears later in this file.
template <typename T>
T CapOrFloatAdd(T x, T y);
291
// Saturated addition: returns x + y, capped to kint64max/kint64min on
// overflow. Dispatches to the best implementation for the toolchain:
// inline asm on GCC/x86_64, compiler built-ins on clang, portable C++
// otherwise.
inline int64_t CapAdd(int64_t x, int64_t y) {
#if defined(__GNUC__) && !defined(__clang__) && defined(__x86_64__)
  return CapAddAsm(x, y);
#elif defined(__clang__)
  return CapAddBuiltIn(x, y);
#else
  return CapAddGeneric(x, y);
#endif
}
301
302inline void CapAddTo(int64_t x, int64_t* y) { *y = CapAdd(*y, x); }
303
// Saturated subtraction: returns x - y, capped to kint64max/kint64min on
// overflow. Same per-toolchain dispatch as CapAdd().
inline int64_t CapSub(int64_t x, int64_t y) {
#if defined(__GNUC__) && !defined(__clang__) && defined(__x86_64__)
  return CapSubAsm(x, y);
#elif defined(__clang__)
  return CapSubBuiltIn(x, y);
#else
  return CapSubGeneric(x, y);
#endif
}
313
// Saturated multiplication: returns x * y, capped to kint64max/kint64min on
// overflow (the cap carries the sign of the mathematical product).
inline int64_t CapProd(int64_t x, int64_t y) {
#if defined(__GNUC__) && defined(__x86_64__)
  // On x86_64, the product of two 64-bit registers is a 128-bit integer,
  // stored in two 64-bit registers. It's the carry flag that is set when the
  // result exceeds 64 bits, not the overflow flag. We therefore have to resort
  // to the assembly-based version of the code.
  return CapProdAsm(x, y);
#elif defined(__clang__)
  return CapProdBuiltIn(x, y);
#else
  return CapProdGeneric(x, y);
#endif
}
327
328template <typename T>
330 static_assert(std::is_floating_point_v<T> || std::is_integral_v<T>);
331 if constexpr (std::is_integral_v<T>) {
332 if constexpr (std::is_same_v<T, int64_t>) {
333 return CapAdd(x, y);
334 } else {
335 static_assert(
336 std::is_same_v<T, int32_t>,
337 "CapOrFloatAdd() on integers only works for int and int64_t");
338 const int64_t sum = int64_t{x} + y;
339 return sum > kint32max ? kint32max : sum < kint32min ? kint32min : sum;
340 }
341 } else {
342 return x + y;
343 }
344}
345
346} // namespace operations_research
347
348#endif // OR_TOOLS_UTIL_SATURATED_ARITHMETIC_H_
IntegerValue y
int64_t b
Definition table.cc:45
int64_t a
Definition table.cc:44
In SWIG mode, we don't want anything besides these top-level includes.
int64_t SubOverflows(int64_t x, int64_t y)
bool AtMinOrMaxInt64(int64_t x)
Checks if x is equal to the min or the max value of an int64_t.
bool AddHadOverflow(int64_t x, int64_t y, int64_t sum)
int64_t CapAdd(int64_t x, int64_t y)
void CapAddTo(int64_t x, int64_t *y)
int64_t CapWithSignOf(int64_t x)
Returns kint64max if x >= 0 and kint64min if x < 0.
int64_t TwosComplementAddition(int64_t x, int64_t y)
-------— Overflow utility functions -------—
int64_t CapSub(int64_t x, int64_t y)
int64_t CapAddGeneric(int64_t x, int64_t y)
bool AddOverflows(int64_t x, int64_t y)
int64_t CapProd(int64_t x, int64_t y)
bool SubHadOverflow(int64_t x, int64_t y, int64_t diff)
int64_t TwosComplementSubtraction(int64_t x, int64_t y)
int64_t CapAbs(int64_t v)
int64_t CapProdGeneric(int64_t x, int64_t y)
bool SafeAddInto(IntegerType a, IntegerType *b)
int64_t CapSubGeneric(int64_t x, int64_t y)
int64_t CapOpp(int64_t v)
Note(user): -kint64min != kint64max, but kint64max == ~kint64min.
int MostSignificantBitPosition64(uint64_t n)
Definition bitset.h:235
const Variable x
Definition qp_tests.cc:127
static const int32_t kint32min
Definition types.h:29
static const int64_t kint64max
Definition types.h:32
static const int32_t kint32max
Definition types.h:30
static const int64_t kint64min
Definition types.h:31