d43b7997c0
-- 7a9e8d95f795be037aa2dce4e44809ad0166aaec by Samuel Benzaquen <sbenza@google.com>: Make end() iterator be nullptr. This makes the creation of and comparison with end() smaller and faster. `find()!=end()` becomes leaner. PiperOrigin-RevId: 304681605 -- 8f3024979446b391b79b1b60ada7d00a504d6aa6 by Derek Mauro <dmauro@google.com>: Fix Bazel's distdir detection and prefer double brackets (bash recommendation) PiperOrigin-RevId: 304615725 -- f1d709cb4b2b3743d548b814dd19602fb057a5e6 by Abseil Team <absl-team@google.com>: Internal change PiperOrigin-RevId: 304570545 -- 2bbfa5bda52057e1938a96c286ad33ff64e535e0 by Gennadiy Rozental <rogeeff@google.com>: Implement general storage case as aligned buffer. Aside from eliminating dynamic memory allocation for flag storage, we also saving 11 bytes per int flag, 15 bytes per double and string flag. PiperOrigin-RevId: 304511965 -- 9e1aed2a95d7d060f8b906fe8c67fc3ba537b521 by Derek Mauro <dmauro@google.com>: Use reserve to make a bad_alloc less likely in endian_test This happened once and shouldn't have happened, so it was probably just a flake, but might as well make this change. PiperOrigin-RevId: 304505572 -- c2faf22ba2d4d66753390e6959494214895581f0 by Gennadiy Rozental <rogeeff@google.com>: Use anonymous bit fields to enforce separation between const and mutable bit fields. We also move init_control field (which is now safe) to save 8 bytes per flag (based on size_tester output) PiperOrigin-RevId: 304505215 -- 7ec51250a84bb03e826b3caad64431e91748186a by Krzysztof Kosiński <krzysio@google.com>: Change the buffer size in AppendNumberUnit to constexpr. PiperOrigin-RevId: 304492779 -- a6c8db1be4f421ea7b7c02f7a01b4f48bad61883 by Gennadiy Rozental <rogeeff@google.com>: Add test cases for two word storage. Some additional tests were added for other storage kinds as well. These came about after I started to look into a coverage output and noticed that some cases (like reading flag values via reflection) were not covered by this test at all. It does not make sense to just add tests for two word values, so I've covered other storage kinds as well. PiperOrigin-RevId: 304432511 -- 2644ecc32e1215cd6451efcb2f1054fd77e7c812 by Abseil Team <absl-team@google.com>: Internal change PiperOrigin-RevId: 304254681 -- 4949a6b20c2bb4b9b2c811f439ccb893abc08df5 by Abseil Team <absl-team@google.com>: Internal change PiperOrigin-RevId: 304250274 GitOrigin-RevId: 7a9e8d95f795be037aa2dce4e44809ad0166aaec Change-Id: I01623de87355bec5cf87cc5932a1ca44cade9aae
111 lines
3.8 KiB
C++
111 lines
3.8 KiB
C++
// Copyright 2017 The Abseil Authors.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// https://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
#ifndef ABSL_RANDOM_INTERNAL_WIDE_MULTIPLY_H_
|
|
#define ABSL_RANDOM_INTERNAL_WIDE_MULTIPLY_H_
|
|
|
|
#include <cstdint>
|
|
#include <limits>
|
|
#include <type_traits>
|
|
|
|
#if (defined(_WIN32) || defined(_WIN64)) && defined(_M_IA64)
|
|
#include <intrin.h> // NOLINT(build/include_order)
|
|
#pragma intrinsic(_umul128)
|
|
#define ABSL_INTERNAL_USE_UMUL128 1
|
|
#endif
|
|
|
|
#include "absl/base/config.h"
|
|
#include "absl/base/internal/bits.h"
|
|
#include "absl/numeric/int128.h"
|
|
#include "absl/random/internal/traits.h"
|
|
|
|
namespace absl {
|
|
ABSL_NAMESPACE_BEGIN
|
|
namespace random_internal {
|
|
|
|
// Helper object to multiply two 64-bit values to a 128-bit value.
|
|
// MultiplyU64ToU128 multiplies two 64-bit values to a 128-bit value.
|
|
// If an intrinsic is available, it is used, otherwise use native 32-bit
|
|
// multiplies to construct the result.
|
|
inline absl::uint128 MultiplyU64ToU128(uint64_t a, uint64_t b) {
|
|
#if defined(ABSL_HAVE_INTRINSIC_INT128)
|
|
return absl::uint128(static_cast<__uint128_t>(a) * b);
|
|
#elif defined(ABSL_INTERNAL_USE_UMUL128)
|
|
// uint64_t * uint64_t => uint128 multiply using imul intrinsic on MSVC.
|
|
uint64_t high = 0;
|
|
const uint64_t low = _umul128(a, b, &high);
|
|
return absl::MakeUint128(high, low);
|
|
#else
|
|
// uint128(a) * uint128(b) in emulated mode computes a full 128-bit x 128-bit
|
|
// multiply. However there are many cases where that is not necessary, and it
|
|
// is only necessary to support a 64-bit x 64-bit = 128-bit multiply. This is
|
|
// for those cases.
|
|
const uint64_t a00 = static_cast<uint32_t>(a);
|
|
const uint64_t a32 = a >> 32;
|
|
const uint64_t b00 = static_cast<uint32_t>(b);
|
|
const uint64_t b32 = b >> 32;
|
|
|
|
const uint64_t c00 = a00 * b00;
|
|
const uint64_t c32a = a00 * b32;
|
|
const uint64_t c32b = a32 * b00;
|
|
const uint64_t c64 = a32 * b32;
|
|
|
|
const uint32_t carry =
|
|
static_cast<uint32_t>(((c00 >> 32) + static_cast<uint32_t>(c32a) +
|
|
static_cast<uint32_t>(c32b)) >>
|
|
32);
|
|
|
|
return absl::MakeUint128(c64 + (c32a >> 32) + (c32b >> 32) + carry,
|
|
c00 + (c32a << 32) + (c32b << 32));
|
|
#endif
|
|
}
|
|
|
|
// wide_multiply<T> multiplies two N-bit values to a 2N-bit result.
|
|
template <typename UIntType>
|
|
struct wide_multiply {
|
|
static constexpr size_t kN = std::numeric_limits<UIntType>::digits;
|
|
using input_type = UIntType;
|
|
using result_type = typename random_internal::unsigned_bits<kN * 2>::type;
|
|
|
|
static result_type multiply(input_type a, input_type b) {
|
|
return static_cast<result_type>(a) * b;
|
|
}
|
|
|
|
static input_type hi(result_type r) { return r >> kN; }
|
|
static input_type lo(result_type r) { return r; }
|
|
|
|
static_assert(std::is_unsigned<UIntType>::value,
|
|
"Class-template wide_multiply<> argument must be unsigned.");
|
|
};
|
|
|
|
#ifndef ABSL_HAVE_INTRINSIC_INT128
|
|
template <>
|
|
struct wide_multiply<uint64_t> {
|
|
using input_type = uint64_t;
|
|
using result_type = absl::uint128;
|
|
|
|
static result_type multiply(uint64_t a, uint64_t b) {
|
|
return MultiplyU64ToU128(a, b);
|
|
}
|
|
|
|
static uint64_t hi(result_type r) { return absl::Uint128High64(r); }
|
|
static uint64_t lo(result_type r) { return absl::Uint128Low64(r); }
|
|
};
|
|
#endif
|
|
|
|
} // namespace random_internal
|
|
ABSL_NAMESPACE_END
|
|
} // namespace absl
|
|
|
|
#endif // ABSL_RANDOM_INTERNAL_WIDE_MULTIPLY_H_
|