// xoshiro/xoshiro_8h_source.html

#pragma once

// SPDX-FileCopyrightText:  2023 Nessan Fitzmaurice <nessan.fitzmaurice@me.com>

// SPDX-License-Identifier: MIT


#include <algorithm>

#include <array>

#include <bit>

#include <cassert>

#include <chrono>

#include <concepts>

#include <cstdint>

#include <format>

#include <iterator>

#include <limits>

#include <ostream>

#include <random>

#include <ranges>

#include <stdexcept>

#include <string>

#include <type_traits>

#include <vector>


// If the `gf2` library is available, we provide extra methods---primarily for analysing new RNG variants.

// For normal use, this is not required & the single-header xoshiro.h works fine without it.

#ifdef GF2

    #include <gf2/gf2.h>

#endif


namespace xso {


// --------------------------------------------------------------------------------------------------------------------

// A C++ concept that lets us distinguish standard distribution types from other types.

// --------------------------------------------------------------------------------------------------------------------


// Satisfied by any type `D` that declares a nested `param_type` -- the member every standard library
// distribution provides -- which is how we tell distributions apart from containers, iterators, etc.
template<typename D>
concept Distribution = requires {
    typename D::param_type;
};


// --------------------------------------------------------------------------------------------------------------------

// Forward declarations of methods defined later in this file.

// --------------------------------------------------------------------------------------------------------------------

// Returns the coefficients of the jump polynomial x^J mod c(x) (or x^(2^J) mod c(x) if `J_is_log2` is true)
// where c(x) is the characteristic polynomial of the `State` type. Defined later in this file.
template<typename State>

constexpr auto jump_coefficients(std::size_t J, bool J_is_log2 = false);


// Returns the coefficients of x^J mod c(x) (or x^(2^J) mod c(x) if `J_is_log2` is true) where c(x) = x^n + p(x)
// and the coefficients of p(x) are passed packed into the words of `p`. Defined later in this file.
template<std::unsigned_integral word_type, std::size_t N>

constexpr auto reduce(const std::array<word_type, N>& p, std::size_t J, bool J_is_log2 = false);


// --------------------------------------------------------------------------------------------------------------------

// The xoshiro/xoroshiro pseudorandom number generator class template.

// --------------------------------------------------------------------------------------------------------------------


/// A pseudorandom number generator assembled from two pieces:
/// - `State`     holds the words of state and knows how to advance them one step.
/// - `Scrambler` is a functor that maps the current state to a single output word.
///
/// The class exposes `result_type`, `min()`, `max()` and `operator()` so an instance can be handed to the
/// distributions in `<random>` and to algorithms such as `std::shuffle` (as the convenience methods below do).
template<typename State, typename Scrambler>
class generator {
public:
    /// The type that stores and steps the state.
    using state_type = State;

    /// The type of the functor that turns the state into an output word.
    using scrambler_type = Scrambler;

    /// The unsigned word type the state is built from.
    using word_type = typename State::word_type;

    /// A `std::array` with one word per word of state.
    using array_type = typename State::array_type;

    /// The type returned by `operator()`.
    using result_type = word_type;

    /// Number of words of state.
    static constexpr std::size_t word_count() { return State::word_count(); }

    /// Number of bits of state.
    static constexpr std::size_t bit_count() { return State::bit_count(); }

    /// Human readable description of this generator: "<state description> with <scrambler description>".
    static constexpr auto type_string() { return std::format("{} with {}", State::type_string(), Scrambler::type_string()); }

    /// Smallest value `operator()` can return.
    static constexpr result_type min() noexcept { return 0; }

    /// Largest value `operator()` can return.
    static constexpr result_type max() noexcept { return std::numeric_limits<result_type>::max(); }

    /// Default construction seeds the state from `std::random_device` and a clock (see `seed()`).
    constexpr generator() { seed(); }

    /// Construct a generator whose full state is expanded from the single word `s` (see `seed(word_type)`).
    explicit constexpr generator(word_type s) { seed(s); }

    /// Construct a generator whose state is copied directly from the words in `[b, e)`.
    template<std::input_iterator Iter>
        requires std::convertible_to<std::iter_value_t<Iter>, word_type>
    explicit constexpr generator(Iter b, Iter e) {
        seed(b, e);
    }

    /// Seed the state from `std::random_device`, with the first word additionally mixed with a scrambled
    /// reading of the high resolution clock in case the random device is poor.
    constexpr void seed() {
        // We use std::random_device as the principal source of entropy.
        std::random_device dev;

        // Fill a full seed array from dev() -- a word wider than the device's output needs two calls.
        array_type full_state;
        if constexpr (sizeof(word_type) <= sizeof(std::random_device::result_type)) {
            for (auto& word : full_state) word = static_cast<word_type>(dev());
        } else {
            for (auto& word : full_state) {
                const auto hi = static_cast<std::uint64_t>(dev());
                const auto lo = static_cast<std::uint64_t>(dev());
                word = static_cast<word_type>(hi << 32 | lo);
            }
        }

        // From call to call the tick count only changes in its low order bits, so scramble it before use.
        using clock_type = std::chrono::high_resolution_clock;
        auto ticks = static_cast<std::uint64_t>(clock_type::now().time_since_epoch().count());
        ticks = murmur_scramble64(ticks);

        // Fold the scrambled ticks into the first seed word and hand the lot to the state.
        full_state[0] ^= static_cast<word_type>(ticks);
        m_state.seed(full_state.cbegin(), full_state.cend());
    }

    /// Seed the full state from a single word: the word is scrambled and then used as the starting point for a
    /// SplitMix64 sequence that supplies one value per word of state. The same `seed` gives the same state.
    constexpr void seed(word_type seed) {
        auto sm64_state = murmur_scramble64(seed);
        array_type full_state;
        for (auto& word : full_state) word = static_cast<word_type>(split_mix64(sm64_state));
        m_state.seed(full_state.cbegin(), full_state.cend());
    }

    /// Seed the state directly from the words in `[b, e)` -- the work is delegated to `State::seed`.
    template<std::input_iterator Src>
        requires std::convertible_to<std::iter_value_t<Src>, word_type>
    constexpr void seed(Src b, Src e) {
        m_state.seed(b, e);
    }

    /// Advance the state by one step without producing any output.
    constexpr void step() { m_state.step(); }

    /// Returns the scrambled value of the *current* state and then advances the state one step.
    constexpr result_type operator()() {
        result_type result = m_scrambler(m_state);
        step();
        return result;
    }

    /// Read-only access to word `i` of the state.
    constexpr word_type operator[](std::size_t i) const { return m_state[i]; }

    /// Copy the words of state to the output iterator `dst`.
    template<std::output_iterator<word_type> Dst>
    constexpr void get_state(Dst dst) const {
        m_state.get_state(dst);
    }

    /// Returns an integer drawn from `std::uniform_int_distribution<T>{a, b}`.
    template<std::integral T>
    constexpr T sample(T a, T b) {
        return std::uniform_int_distribution<T>{a, b}(*this);
    }

    /// Returns a real number drawn from `std::uniform_real_distribution<T>{a, b}`.
    template<std::floating_point T>
    constexpr T sample(T a, T b) {
        return std::uniform_real_distribution<T>{a, b}(*this);
    }

    /// Returns an index drawn uniformly from `0, 1, ..., len - 1`. The caller must pass `len > 0`.
    template<std::integral T>
    constexpr T index(T len) {
        return sample(T{0}, len - 1);
    }

    /// Returns a copy of one element picked at random from the range `[b, e)`.
    ///
    /// Throws `std::invalid_argument` if the range is empty -- there is no element to return and dereferencing
    /// the end iterator (which is what used to happen) is undefined behaviour.
    template<std::input_iterator T>
    constexpr auto sample(T b, T e) {
        const auto len = std::distance(b, e);
        if (len == 0) throw std::invalid_argument("xso::generator::sample called on an empty range!");

        // With a single element there is nothing to choose between.
        if (len < 2) return *b;

        // Pick an index inside the range at random & return the corresponding value.
        auto i = index(len);
        std::advance(b, i);
        return *b;
    }

    /// Returns a copy of one element picked at random from `container`.
    template<typename Container>
        requires std::ranges::input_range<const Container> && std::ranges::common_range<const Container>
    constexpr auto sample(const Container& container) {
        return sample(std::ranges::cbegin(container), std::ranges::cend(container));
    }

    /// Writes `n` elements picked from `[b, e)` to `dst` using `std::sample` and returns the advanced `dst`.
    template<std::input_iterator Src, std::output_iterator<std::iter_value_t<Src>> Dst>
    constexpr Dst sample(Src b, Src e, Dst dst, std::size_t n) {
        return std::sample(b, e, dst, n, *this);
    }

    /// Writes `n` elements picked from the range `src` to `dst` using `std::sample` and returns the advanced `dst`.
    template<typename Src, std::output_iterator<std::ranges::range_value_t<const Src>> Dst>
        requires std::ranges::input_range<const Src> && std::ranges::common_range<const Src>
    constexpr auto sample(const Src& src, Dst dst, std::size_t n) {
        return sample(std::ranges::cbegin(src), std::ranges::cend(src), dst, n);
    }

    /// Returns a single variate drawn from the distribution `dist`.
    constexpr auto sample(Distribution auto& dist) { return dist(*this); }

    /// Writes `n` variates drawn from the distribution `dist` to `dst` and returns the advanced `dst`.
    template<typename Dst>
    constexpr Dst sample(Distribution auto& dist, Dst dst, std::size_t n) {
        while (n-- != 0) *dst++ = dist(*this);
        return dst;
    }

    /// Rolls a fair die: returns an integer drawn uniformly from `1, ..., n_sides`.
    constexpr std::size_t roll(std::size_t n_sides = 6) { return sample(1uz, n_sides); }

    /// Flips a coin that comes up `true` with probability `p`.
    constexpr bool flip(double p = 0.5) { return std::bernoulli_distribution{p}(*this); }

    /// Shuffles the elements in `[b, e)` using `std::shuffle`.
    template<std::random_access_iterator Iter>
    constexpr void shuffle(Iter b, Iter e) {
        std::shuffle(b, e, *this);
    }

    /// Shuffles the elements of `container` in place.
    template<typename Container>
        requires std::ranges::random_access_range<Container> && std::ranges::common_range<Container>
    constexpr void shuffle(Container& container) {
        return shuffle(std::begin(container), std::end(container));
    }

    /// Advances the state by `z` steps, one step at a time.
    constexpr void discard(std::uint64_t z) {
        for (std::uint64_t i = 0; i < z; ++i) step();
    }

    /// Jumps the state ahead by `n` steps (or by `2^n` steps if `n_is_log2` is true).
    ///
    /// Returns the jump polynomial coefficients that were computed so the caller can reuse them with the
    /// `jump(const array_type&)` overload. Computing the coefficients can throw if the characteristic
    /// polynomial for the state type has not been precomputed.
    constexpr auto jump(std::size_t n, bool n_is_log2 = false) {
        auto jump_coeffs = xso::jump_coefficients<state_type>(n, n_is_log2);
        jump(jump_coeffs);
        return jump_coeffs;
    }

    /// Jumps the state ahead using precomputed jump polynomial coefficients (bit `b` of word `i` is the
    /// coefficient of x^(i * bits_per_word + b)).
    constexpr void jump(const array_type& jump_coefficients) {
        constexpr std::size_t bits_per_word = std::numeric_limits<word_type>::digits;

        // lambda: `is_set(word, b)` returns true if bit `b` in `word` is set.
        auto is_set = [](const word_type word, std::size_t b) -> bool {
            return word & static_cast<word_type>(word_type{1} << b);
        };

        // If the current state is `s` and the state's transition matrix is T then the jump we want is s <- (T^n).s.
        // Cayley-Hamilton is invoked to equate T^n with a small polynomial sum r(T) where r(x) = x^n mod c(x)
        // and c(x) is the characteristic polynomial for T. Thus (T^n).s == r(T).s which is doable.
        //
        // The loop accumulates r(T).s = r_0.s + r_1.(T.s) + r_2.(T^2.s) + ... where each successive T^k.s is
        // obtained by stepping the state once more.
        array_type sum;
        sum.fill(0);
        for (auto i = 0uz; i < word_count(); ++i) {
            const word_type r_word = jump_coefficients[i];
            for (auto b = 0uz; b < bits_per_word; ++b) {
                if (is_set(r_word, b)) {
                    // This coefficient of r(x) is one so the current stepped state contributes to the sum.
                    for (auto w = 0uz; w < word_count(); ++w) sum[w] ^= m_state[w];
                }
                m_state.step();
            }
        }

        // Store the computed jumped state back as our current state so we are ready to proceed from there.
        m_state.seed(sum.cbegin(), sum.cend());
    }

    /// Writes the precomputed characteristic polynomial coefficients for the state type to `dst`.
    template<std::output_iterator<word_type> Dst>
    static constexpr void characteristic_coefficients(Dst dst) {
        State::characteristic_coefficients(dst);
    }

    /// Returns the precomputed characteristic polynomial coefficients for the state type as an array.
    static constexpr auto characteristic_coefficients() {
        array_type result;
        State::characteristic_coefficients(result.begin());
        return result;
    }

#ifdef GF2

    /// Jumps the state ahead using a jump polynomial supplied as a `gf2::BitPolynomial`.
    void jump(gf2::BitPolynomial<word_type> const& jump_poly) {
        // Computing [r_0 + r_1 T + ... + r_{m-1} T^{m-1}].s where s is the current state and r is the jump polynomial.
        // T is the state's transition matrix so we can compute s^{i+1} = T.s^i using the step() method.
        array_type sum;
        sum.fill(0);
        for (auto i = 0uz; i < jump_poly.size(); ++i) {
            if (jump_poly[i])
                for (std::size_t w = 0; w < word_count(); ++w) sum[w] ^= m_state[w];
            m_state.step();
        }

        // Perform the computed jump by reseeding the state from the computed sum.
        m_state.seed(sum.cbegin(), sum.cend());
    }

#endif

private:
    State     m_state;
    Scrambler m_scrambler;

    // An implementation of the SplitMix64 random number generator -- a simple generator with 64 bits of state.
    // Advances `state` in place and returns the next output.
    //
    // Used here to help seed our more complex generators from a single seed value.
    static constexpr std::uint64_t split_mix64(std::uint64_t& state) {
        std::uint64_t z = (state += 0x9e3779b97f4a7c15ULL);
        z = (z ^ (z >> 30)) * 0xbf58476d1ce4e5b9ULL;
        z = (z ^ (z >> 27)) * 0x94d049bb133111ebULL;
        z = (z ^ (z >> 31));
        return z;
    }

    // Returns a 64-bit word that is a scrambled version of the input 64-bit value.
    //
    // This is based on the MurmurHash3 finalizer function.
    static constexpr std::uint64_t murmur_scramble64(std::uint64_t x) {
        x ^= x >> 33;
        x *= 0xff51afd7ed558ccdULL;
        x ^= x >> 33;
        x *= 0xc4ceb9fe1a85ec53ULL;
        x ^= x >> 33;
        return x;
    }

    // Returns a 32-bit word that is a scrambled version of the input 32-bit value.
    //
    // This is based on the MurmurHash3 mix function.
    static constexpr std::uint32_t murmur_scramble32(std::uint32_t x) {
        x *= 0xcc9e2d51;
        x = (x << 15) | (x >> 17);
        x *= 0x1b873593;
        return x;
    }
};


// --------------------------------------------------------------------------------------------------------------------

// The Xoshiro state:

// --------------------------------------------------------------------------------------------------------------------


/// The xoshiro state: `N` words of type `T` that are advanced by a xor/shift/rotate step using the shift `A`
/// and the rotation `B`. A step is only implemented for `N == 4` and `N == 8`.
///
/// The state should never be all zeros -- a default constructed state has its first word set to 1.
template<std::size_t N, std::unsigned_integral T, std::uint8_t A, std::uint8_t B>
class xoshiro {
public:
    /// The unsigned word type the state is built from.
    using word_type = T;

    /// A `std::array` with one word per word of state.
    using array_type = std::array<T, N>;

    /// Number of words of state.
    static constexpr std::size_t word_count() { return N; }

    /// Number of bits of state.
    static constexpr std::size_t bit_count() { return N * std::numeric_limits<T>::digits; }

    /// Human readable description of this state type, e.g. "xoshiro<4x64,17,45>".
    static constexpr auto type_string() {
        return std::format("xoshiro<{}x{},{},{}>", N, std::numeric_limits<T>::digits, A, B);
    }

    /// Read-only access to word `i` of the state (no bounds check).
    constexpr T operator[](std::size_t i) const { return m_state[i]; }

    /// Copy the `N` words of state to the output iterator `dst`.
    template<std::output_iterator<word_type> Dst>
    constexpr void get_state(Dst dst) const {
        std::copy(m_state.cbegin(), m_state.cend(), dst);
    }

    /// Set the state from the words in `[b, e)`.
    ///
    /// At most `N` words are consumed -- any extra words are ignored rather than written past the end of the
    /// state array. If fewer than `N` words are supplied the remaining words of state keep their old values.
    template<std::input_iterator Src>
        requires std::convertible_to<std::iter_value_t<Src>, word_type>
    constexpr void seed(Src b, Src e) {
        for (auto dst = m_state.begin(); dst != m_state.end() && b != e; ++dst, ++b) *dst = static_cast<word_type>(*b);
    }

    /// Advance the state by one step.
    constexpr void step() {
        if constexpr (N == 4) {
            const T tmp = static_cast<T>(m_state[1] << A);
            m_state[2] ^= m_state[0];
            m_state[3] ^= m_state[1];
            m_state[1] ^= m_state[2];
            m_state[0] ^= m_state[3];
            m_state[2] ^= tmp;
            m_state[3] = std::rotl(m_state[3], B);
        } else if constexpr (N == 8) {
            const T tmp = static_cast<T>(m_state[1] << A);
            m_state[2] ^= m_state[0];
            m_state[5] ^= m_state[1];
            m_state[1] ^= m_state[2];
            m_state[7] ^= m_state[3];
            m_state[3] ^= m_state[4];
            m_state[4] ^= m_state[5];
            m_state[0] ^= m_state[6];
            m_state[6] ^= m_state[7];
            m_state[6] ^= tmp;
            m_state[7] = std::rotl(m_state[7], B);
        } else {
            // Get a useful'ish error message by pumping a deliberately false condition into static_assert(...).
            static_assert(N < 0, "No xoshiro step() implementation for this number of words of state!");
        }
    }

    /// Writes the `N` words holding the precomputed coefficients of p(x) to `dst`, where the characteristic
    /// polynomial of the step is c(x) = x^n + p(x).
    ///
    /// Throws `std::invalid_argument` if nothing has been precomputed for this combination of parameters.
    template<std::output_iterator<word_type> Dst>
    static constexpr void characteristic_coefficients(Dst dst) {
        // In practice we have precomputed the p(x) polynomial for just a few xoshiro's with specific parameters.
        if constexpr (std::is_same_v<T, std::uint32_t> && N == 4 && A == 9 && B == 11) {
            std::array<T, N> p = {0xde18fc01, 0x1b489db6, 0x6254b1, 0xfc65a2};
            std::copy(p.cbegin(), p.cend(), dst);
        } else if constexpr (std::is_same_v<T, std::uint64_t> && N == 4 && A == 17 && B == 45) {
            std::array<T, N> p = {0x9d116f2bb0f0f001, 0x280002bcefd1a5e, 0x4b4edcf26259f85, 0x3c03c3f3ecb19};
            std::copy(p.cbegin(), p.cend(), dst);
        } else if constexpr (std::is_same_v<T, std::uint64_t> && N == 8 && A == 11 && B == 21) {
            std::array<T, N> p = {0xcf3cff0c00000001, 0x7fdc78d886f00c63, 0xf05e63fca6d7b781, 0x7a67058e7bbab6f0,
                                  0xf11eef832e32518f, 0x51ba7c47edc758ad, 0x8f2d27268ce4b20b, 0x500055d8b77f};
            std::copy(p.cbegin(), p.cend(), dst);
        } else {
            throw std::invalid_argument("xoshiro characteristic polynomial not pre-computed for given parameters!");
        }
    }

    /// Returns the precomputed coefficients of p(x) as an array (see the iterator overload).
    static constexpr auto characteristic_coefficients() {
        array_type result;
        characteristic_coefficients(result.begin());
        return result;
    }

private:
    std::array<T, N> m_state = {1}; // The words of state -- should never be all zeros!
};


// --------------------------------------------------------------------------------------------------------------------

// The Xoroshiro State:

// --------------------------------------------------------------------------------------------------------------------


/// The xoroshiro state: `N` words of type `T` advanced by a xor/rotate/shift step with parameters `A`, `B`, `C`.
///
/// Each step only modifies the first and final words and then shifts every word down one slot. For `N == 2`
/// that is done literally; otherwise the array is treated as a ring buffer and only the index of the final
/// word moves. `operator[]` and `get_state` hide that detail: index 0 is always the logical first word.
///
/// The state should never be all zeros -- a default constructed state has its first word set to 1.
template<std::size_t N, std::unsigned_integral T, std::uint8_t A, std::uint8_t B, std::uint8_t C>
class xoroshiro {
public:
    /// The unsigned word type the state is built from.
    using word_type = T;

    /// A `std::array` with one word per word of state.
    using array_type = std::array<T, N>;

    /// Number of words of state.
    static constexpr std::size_t word_count() { return N; }

    /// Number of bits of state.
    static constexpr std::size_t bit_count() { return N * std::numeric_limits<T>::digits; }

    /// Human readable description of this state type, e.g. "xoroshiro<2x64,24,16,37>".
    static constexpr auto type_string() {
        return std::format("xoroshiro<{}x{},{},{},{}>", N, std::numeric_limits<T>::digits, A, B, C);
    }

    /// Read-only access to logical word `i` of the state (the ring buffer offset is applied here).
    constexpr T operator[](std::size_t i) const { return m_state[(i + m_final + 1) % N]; }

    /// Copy the `N` words of state, in logical order, to the output iterator `dst`.
    template<std::output_iterator<word_type> Dst>
    constexpr void get_state(Dst dst) const {
        for (auto i = 0uz; i < N; ++i, ++dst) *dst = operator[](i);
    }

    /// Set the state from the words in `[b, e)` and reset the ring buffer so word 0 is the first word again.
    ///
    /// At most `N` words are consumed -- any extra words are ignored rather than written past the end of the
    /// state array. If fewer than `N` words are supplied the remaining slots keep their old contents.
    template<std::input_iterator Src>
        requires std::convertible_to<std::iter_value_t<Src>, word_type>
    constexpr void seed(Src b, Src e) {
        for (auto dst = m_state.begin(); dst != m_state.end() && b != e; ++dst, ++b) *dst = static_cast<word_type>(*b);

        // Reset the ring buffer final index
        m_final = N - 1;
    }

    /// Advance the state by one step.
    constexpr void step() {
        // Depending on the size of `N` we either do an explicit or implicit array shuffle of the state array.
        if constexpr (N == 2)
            simple_step();
        else
            clever_step();
    }

    /// Writes the `N` words holding the precomputed coefficients of p(x) to `dst`, where the characteristic
    /// polynomial of the step is c(x) = x^n + p(x).
    ///
    /// Throws `std::invalid_argument` if nothing has been precomputed for this combination of parameters.
    template<std::output_iterator<word_type> Dst>
    static constexpr void characteristic_coefficients(Dst dst) {
        if constexpr (std::is_same_v<T, std::uint32_t> && N == 2 && A == 26 && B == 9 && C == 13) {
            std::array<T, N> p = {0x6e2286c1, 0x53be9da};
            std::copy(p.cbegin(), p.cend(), dst);
        } else if constexpr (std::is_same_v<T, std::uint64_t> && N == 2 && A == 24 && B == 16 && C == 37) {
            std::array<T, N> p = {0x95b8f76579aa001, 0x8828e513b43d5};
            std::copy(p.cbegin(), p.cend(), dst);
        } else if constexpr (std::is_same_v<T, std::uint64_t> && N == 2 && A == 49 && B == 21 && C == 28) {
            std::array<T, N> p = {0x8dae70779760b081, 0x31bcf2f855d6e5};
            std::copy(p.cbegin(), p.cend(), dst);
        } else if constexpr (std::is_same_v<T, std::uint64_t> && N == 16 && A == 25 && B == 27 && C == 36) {
            std::array<T, N> p = {0x5cfeb8cc48ddb211, 0xb73e379d035a06dd, 0x17d5100a20a0350e, 0x7550223f68f98cac,
                                  0x29d373b5c5ed3459, 0x3689b412ef70de48, 0xa1d3b6ee079a7cc6, 0x9bf0b669abd100f8,
                                  0x955c84e105f60997, 0x6ca140c61889cddd, 0xabaf68c5fc3a0e4a, 0xa46134526b83adc5,
                                  0x710704d05683d63,  0x580d080b44b606a2, 0x8040a0580158a1,   0x800081};
            std::copy(p.cbegin(), p.cend(), dst);
        } else {
            throw std::invalid_argument("xoroshiro characteristic polynomial not pre-computed for given parameters!");
        }
    }

    /// Returns the precomputed coefficients of p(x) as an array (see the iterator overload).
    static constexpr auto characteristic_coefficients() {
        array_type result;
        characteristic_coefficients(result.begin());
        return result;
    }

private:
    std::array<T, N> m_state = {1};   // The state is an array of words -- should never be all zeros!
    std::size_t      m_final = N - 1; // Current location of the final word of state.

    // Step that physically moves the words of state down one slot (only used when N == 2).
    constexpr void simple_step() {
        // Capture the current values in the first and final words of state
        T s0 = m_state[0];
        T s1 = m_state[N - 1];

        // Shift most of the words of state down one slot
        for (auto i = 0uz; i < N - 2; ++i) m_state[i] = m_state[i + 1];

        // Update the first and final words of state
        s1 ^= s0;
        m_state[N - 2] = std::rotl(s0, A) ^ (s1 << B) ^ s1;
        m_state[N - 1] = std::rotl(s1, C);
    }

    // Step that leaves the words where they are and moves the index of the final word instead.
    constexpr void clever_step() {
        // Which indices point to the current final & first words of state
        const std::size_t i_final = m_final;
        const std::size_t i_first = (m_final + 1) % N;

        // Capture the current values in the final & first words of state
        T       s_final = m_state[i_final];
        const T s_first = m_state[i_first];

        // Update the values for the final & first words of state
        s_final ^= s_first;
        m_state[i_final] = std::rotl(s_first, A) ^ (s_final << B) ^ s_final;
        m_state[i_first] = std::rotl(s_final, C);

        // Step the index of the final word of state -- this shuffles the state array down a slot.
        m_final = i_first;
    }
};


// --------------------------------------------------------------------------------------------------------------------

// The Scramblers:

//

// A Scrambler is a functor that is passed a State and returns a single unsigned output word.

// --------------------------------------------------------------------------------------------------------------------


// The "*" scrambler: the output is word `w` of the state multiplied by the constant `S`.
template<auto S, std::size_t w = 0>
struct star {
    constexpr auto operator()(const auto& state) const
    {
        const auto word = state[w];
        return S * word;
    }

    // Human readable description of this scrambler (the multiplier is shown in hex).
    static constexpr auto type_string()
    {
        return std::format("star<{:x},{}>", S, w);
    }
};


// The "**" scrambler: word `w` of the state is multiplied by `S`, rotated left by `R` bits, and the result is
// then multiplied by `T`.
template<auto S, auto R, auto T, std::size_t w = 0>
struct star_star {
    constexpr auto operator()(const auto& state) const
    {
        const auto scaled = S * state[w];
        return T * std::rotl(scaled, R);
    }

    // Human readable description of this scrambler (the two multipliers are shown in hex).
    static constexpr auto type_string()
    {
        return std::format("star_star<{:x},{},{:x},{}>", S, R, T, w);
    }
};


// The "+" scrambler: the output is the sum of words `w0` and `w1` of the state.
template<std::size_t w0 = 0, std::size_t w1 = 1>
struct plus {
    constexpr auto operator()(const auto& state) const
    {
        const auto lhs = state[w0];
        const auto rhs = state[w1];
        return lhs + rhs;
    }

    // Human readable description of this scrambler.
    static constexpr auto type_string()
    {
        return std::format("plus<{},{}>", w0, w1);
    }
};


// The "++" scrambler: words `w0` and `w1` of the state are added, the sum is rotated left by `R` bits, and
// word `w0` is then added to the rotated value.
template<auto R, std::size_t w0, std::size_t w1>
struct plus_plus {
    constexpr auto operator()(const auto& state) const
    {
        const auto rotated = std::rotl(state[w0] + state[w1], R);
        return rotated + state[w0];
    }

    // Human readable description of this scrambler.
    static constexpr auto type_string()
    {
        return std::format("plus_plus<{},{},{}>", R, w0, w1);
    }
};


// --------------------------------------------------------------------------------------------------------------------

// Type aliases for all 17 generators discussed in the Blackman & Vigna paper

// --------------------------------------------------------------------------------------------------------------------


// clang-format off

// The analysed versions of the xoshiro state with specific choices for A & B.
// Template arguments are: number of words, word type, A, B.

using xoshiro_4x32              = xoshiro<4, uint32_t, 9,  11>;

using xoshiro_4x64              = xoshiro<4, uint64_t, 17, 45>;

using xoshiro_8x64              = xoshiro<8, uint64_t, 11, 21>;


// The analysed versions of the xoroshiro state with specific choices for A, B & C.
// Template arguments are: number of words, word type, A, B, C.

using xoroshiro_2x32            = xoroshiro<2,  uint32_t, 26, 9,  13>;

using xoroshiro_2x64            = xoroshiro<2,  uint64_t, 24, 16, 37>;

using xoroshiro_2x64b           = xoroshiro<2,  uint64_t, 49, 21, 28>;  // Alternative for 2x64 case

using xoroshiro_16x64           = xoroshiro<16, uint64_t, 25, 27, 36>;


// The analysed versions of the xoshiro generators (a xoshiro state paired with a scrambler):

using xoshiro_4x32_plus         = generator<xoshiro_4x32, plus<0, 3>>;

using xoshiro_4x32_plus_plus    = generator<xoshiro_4x32, plus_plus<7, 0, 3>>;

using xoshiro_4x32_star_star    = generator<xoshiro_4x32, star_star<5, 7, 9, 1>>;

using xoshiro_4x64_plus         = generator<xoshiro_4x64, plus<0, 3>>;

using xoshiro_4x64_plus_plus    = generator<xoshiro_4x64, plus_plus<23, 0, 3>>;

using xoshiro_4x64_star_star    = generator<xoshiro_4x64, star_star<5, 7, 9, 1>>;

using xoshiro_8x64_plus         = generator<xoshiro_8x64, plus<2, 0>>;

using xoshiro_8x64_plus_plus    = generator<xoshiro_8x64, plus_plus<17, 2, 0>>;

using xoshiro_8x64_star_star    = generator<xoshiro_8x64, star_star<5, 7, 9, 1>>;


// The analysed versions of the xoroshiro generators (a xoroshiro state paired with a scrambler).
// Note that the 2x64 plus_plus generator is built on the alternative `xoroshiro_2x64b` state.

using xoroshiro_2x32_star       = generator<xoroshiro_2x32,  star<0x9E3779BB, 0>>;

using xoroshiro_2x32_star_star  = generator<xoroshiro_2x32,  star_star<0x9E3779BB, 5, 5, 0>>;

using xoroshiro_2x64_plus       = generator<xoroshiro_2x64,  plus<0, 1>>;

using xoroshiro_2x64_plus_plus  = generator<xoroshiro_2x64b, plus_plus<17, 0, 1>>;

using xoroshiro_2x64_star_star  = generator<xoroshiro_2x64,  star_star<5, 7, 9, 0>>;

using xoroshiro_16x64_plus_plus = generator<xoroshiro_16x64, plus_plus<23, 15, 0>>;

using xoroshiro_16x64_star      = generator<xoroshiro_16x64, star<0x9e3779b97f4a7c13, 0>>;

using xoroshiro_16x64_star_star = generator<xoroshiro_16x64, star_star<5, 7, 9, 0>>;

// clang-format on


// The default generator that produces 32-bit outputs.
using rng32 = xoshiro_4x32_star_star;


// The default generator that produces 64-bit outputs.
using rng64 = xoshiro_4x64_star_star;


// The overall default generator is the 64-bit one.
using rng = rng64;


// --------------------------------------------------------------------------------------------------------------------

// Partitions of random number stream:

//

// For parallel processing applications it can be useful to split a single random number stream into a number of

// non-overlapping "partitions". Then different computational threads can get their "own set" of random numbers without

// worrying about stream overlaps etc.

//

// The partitions need to be very large so this only works for States where we can jump far ahead in an efficient way.

// --------------------------------------------------------------------------------------------------------------------


// Splits the stream of a parent generator into large, evenly spaced sub-streams.
//
// Construct it from a parent generator and the number of partitions wanted, then call `next()` once per
// partition: each call hands back a generator positioned at the start of the next sub-stream.
template<typename RNG>
class partition {
public:
    // Takes a copy of `rng` and precomputes the jump needed to hop from one partition to the next.
    // A request for zero partitions is silently treated as a request for one.
    partition(const RNG& rng, std::size_t n_partitions) : m_rng{rng} {
        const std::size_t wanted = (n_partitions == 0) ? 1 : n_partitions;

        // The period of the generator is `2^state_bits` so each partition ideally has `2^state_bits / wanted`
        // elements. That number will probably overflow a std::size_t so everything is kept in log 2 form.
        const auto state_bits = RNG::bit_count();

        // Smallest exponent with `2^log2_count >= wanted` -- e.g. both 100 and 128 partitions give 7.
        // We effectively create `2^log2_count` partitions which may be more than needed but the waste is negligible.
        const auto log2_count = static_cast<std::size_t>(std::bit_width(wanted - 1));

        // Moving from one of those partitions to the next is a jump of `2^(state_bits - log2_count)` steps.
        const auto log2_jump = state_bits - log2_count;

        // Precompute the coefficients for that jump once so that `next()` is cheap.
        m_jump_coefficients = xso::jump_coefficients<typename RNG::state_type>(log2_jump, true);
    }

    // Returns a generator sitting at the start of the next unused partition.
    RNG next() {
        // The parent copy is already parked at the right spot so snapshot it ...
        RNG current(m_rng);

        // ... then move the parent copy along to the start of the following partition for the next call.
        m_rng.jump(m_jump_coefficients);

        return current;
    }

private:
    using array_type = typename RNG::array_type;

    RNG        m_rng;               // Our copy of the parent, parked at the start of the next partition.
    array_type m_jump_coefficients; // Jump polynomial coefficients to hop forward by one partition.
};


// --------------------------------------------------------------------------------------------------------------------

// Non-member functions for computing jump polynomials:

// --------------------------------------------------------------------------------------------------------------------


// Returns the coefficients of the jump polynomial for the `State` type: x^n mod c(x), or x^(2^n) mod c(x) if
// `n_is_log2` is true, where c(x) is the characteristic polynomial of the state's step.
//
// Fetching the characteristic polynomial can throw if it was not precomputed for the `State` parameters.
template<typename State>
constexpr auto
jump_coefficients(std::size_t n, bool n_is_log2)
{
    using word_type = typename State::word_type;

    // The reduction wants p(x) where c(x) = x^n + p(x) -- those are the coefficients the state hands us.
    std::array<word_type, State::word_count()> p;
    State::characteristic_coefficients(p.begin());

    return xso::reduce(p, n, n_is_log2);
}


// --------------------------------------------------------------------------------------------------------------------

// We have some "internal" functions that reduce x^J mod c(x) --- needed for the jump polynomial computations.

// These re-implement a more general reduction method in the gf2::BitPolynomial class (https://nessan.github.io/gf2/).

// Repeated here to make `xoshiro.h` self-contained.

//

// Not part of the public API but used for the jump calculations in the generator class.

// --------------------------------------------------------------------------------------------------------------------


// "Riffles" the bits of `src` into two words: `lo` gets the bits from the low half of `src` and `hi` the bits
// from the high half, in both cases interleaved with zeros.
//
// Bit `k` of each half ends up at bit `2k` of the corresponding output word and every odd bit is zero.
//
// # Example
// ```
// std::uint8_t src = 0b1111'1111;
// std::uint8_t lo, hi;
// xso::riffle(src, lo, hi);
// assert_eq(lo, 0b01010101, "lo is {:08b}", lo);
// assert_eq(hi, 0b01010101, "hi is {:08b}", hi);
// ```
// **NOTE:** This function is "public" for testing purposes only -- it is not part of the normal interface.
template<std::unsigned_integral word_type>
constexpr void
riffle(word_type src, word_type& lo, word_type& hi)
{
    constexpr std::size_t word_bits = std::numeric_limits<word_type>::digits;
    constexpr std::size_t half = word_bits / 2;
    constexpr word_type   all_set = std::numeric_limits<word_type>::max();
    constexpr word_type   unit{1};

    // Start with the two halves of src sitting in the low order bits of the outputs.
    hi = src >> half;
    lo = src & (all_set >> half);

    // Repeatedly spread the bits apart: each pass moves the upper part of every group up by `shift` places
    // and masks away the copies left behind. The masks are 0x00FF.., 0x0F0F.., 0x3333.., 0x5555.. in turn.
    std::size_t shift = word_bits / 4;
    while (shift > 0) {
        const word_type mask = all_set / (word_type(unit << shift) | unit);
        lo = (lo ^ (lo << shift)) & mask;
        hi = (hi ^ (hi << shift)) & mask;
        shift /= 2;
    }
}


// Function that riffles a `src` array of unsigneds into two others `lo` and `hi` which will be filled with the

// bits from `src` interleaved with zeros.

//

// We treat `lo` and `hi` as contiguous storage and fill the elements of `lo` first and then `hi`.

// This allows us to optionally reuse `src` for the output array `lo` -- the call `riffle(src, src, hi)` will work.

//

// # Example

// ```

// std::array<std::uint8_t, 2> src = {0b1111'1111, 0b1111'1111};

// std::array<std::uint8_t, 2> lo, hi;

// xso::riffle(src, lo, hi);

// assert_eq(lo, (std::array<std::uint8_t, 2>{0b01010101, 0b01010101}));

// assert_eq(hi, (std::array<std::uint8_t, 2>{0b01010101, 0b01010101}));

// ```

// *NOTE:** This function is "public" for testing purposes only -- it is not part of the normal interface.

template<std::unsigned_integral word_type, std::size_t N>

static constexpr void

riffle(const std::array<word_type, N>& src, std::array<word_type, N>& lo, std::array<word_type, N>& hi) {

    // We will riffle each word in src into two other words x & y

    word_type x, y;


    // We work through `src` in reverse order -- this allows the reuse of `src` for `lo`!

    // Treating [lo|hi] as contiguous storage, first working back through hi and then back through lo.

    for (std::size_t i = N; i-- > 0;) {

        riffle(src[i], x, y);

        if (2 * i + 1 > N) {

            // Both x & y go in hi -- note that if 2i + 1 - N > 0 then 2i - N is >= 0.

            hi[2 * i - N] = x;

            hi[2 * i + 1 - N] = y;

        } else if (2 * i + 1 == N) {

            // Straddling situation where y goes in the first word of hi and x in the last word of lo.

            lo[N - 1] = x;

            hi[0] = y;

        } else {

            // Need to pop both x & y into the lo array.

            lo[2 * i] = x;

            lo[2 * i + 1] = y;

        }

    }

}


// Function that computes r(x) = x^e mod c(x) in GF(2) where e = J or 2^J and J is an unsigned integer argument.
//
// The polynomial c(x) is monic of degree n so c(x) = x^n + p(x) where p(x) is a polynomial of degree less than n.
// We are passed the n coefficients of p(x) packed into an array of N unsigned words, so n = N * bits-per-word and
// coefficient p_i lives in bit (i % bits-per-word) of word (i / bits-per-word).
// We return the coefficients of r(x) = x^e mod c(x) packed into an array of unsigned integers in the same format.
//
// # Arguments
// - `p`:         the n low-order coefficients of c(x) (the leading x^n term is implicit).
// - `J`:         the exponent e itself, or log2(e) if `J_is_log2` is true.
// - `J_is_log2`: if true we compute x^(2^J) mod c(x), otherwise x^J mod c(x).
//
// # Note
// Any linting tool you use will (reasonably) complain that the complexity of this method is too high!
// The method is a direct re-implementation of the `gf2::BitPolynomial::reduce` method which is also complex but
// easier to understand as it is properly factored. The version here is less general as it assumes that the
// degree of c(x) is a whole number of words (in practice a multiple of 32).
//
// **NOTE:** This method is "public" for testing purposes only -- it is not part of the normal interface.
template<std::unsigned_integral word_type, std::size_t N>
constexpr auto
reduce(const std::array<word_type, N>& p, std::size_t J, bool J_is_log2) {
    static_assert(N > 0, "reduce: the coefficient array must hold at least one word");

    // We will return the coefficients of r(x) = x^e mod c(x) packed into an array of unsigned integers of this type.
    using array_type = std::array<word_type, N>;

    // Constant we use to indicate "no such position"/"not found" and a couple of others.
    constexpr auto      npos = static_cast<std::size_t>(-1);
    constexpr word_type one{1};

    // The polynomial c(x) = x^n + p(x) where p(x) = p_0 + p_1 x + ... + p_{n-1} x^{n-1} and n is:
    constexpr std::size_t bits_per_word = std::numeric_limits<word_type>::digits;
    constexpr std::size_t n = N * bits_per_word;

    // lambda: Returns the index of the word that holds p_i.
    auto word = [=](std::size_t i) { return i / bits_per_word; };

    // lambda: Returns the bit location of p_i inside the word that holds it.
    auto bit = [=](std::size_t i) { return i % bits_per_word; };

    // lambda: Returns a mask that isolates p_i within the word that holds it.
    // NOTE: We cast instead of brace-initialising -- for word types narrower than `int` the shift is done in `int`
    // and a braced conversion back to `word_type` would be an (ill-formed) narrowing conversion.
    auto mask = [=](std::size_t i) { return static_cast<word_type>(one << bit(i)); };

    // lambda: Returns true if poly_i is 1.
    auto test = [=](const auto& poly, std::size_t i) -> bool { return (poly[word(i)] & mask(i)) != 0; };

    // lambda: Sets poly_i to 1.
    auto set = [=](auto& poly, std::size_t i) { poly[word(i)] |= mask(i); };

    // Initialize our return value to all zeros.
    array_type result{};

    // The trivial cases are handled first so they never pay for the (heap allocated) table of powers built below.
    if (!J_is_log2) {
        // Case e = J < n: Then x^J mod c(x) = x^J so we can set the appropriate coefficient in r and return.
        if (J < n) {
            set(result, J);
            return result;
        }

        // Case e = J = n: Then x^J mod c(x) = p(x).
        if (J == n) return p;
    }

    // lambda: Returns the index for the least significant set bit in the argument or `npos` if none set.
    auto lsb = [=](word_type w) { return w == 0 ? npos : static_cast<std::size_t>(std::countr_zero(w)); };

    // lambda: Returns the index for the most significant set bit in the argument or `npos` if none set.
    auto msb = [=](word_type w) { return w == 0 ? npos : static_cast<std::size_t>(std::bit_width(w) - 1); };

    // lambda: Returns the first set coefficient in poly or `npos` if the coefficients are all zero.
    auto first_set = [=](const auto& poly) {
        for (std::size_t i = 0; i < N; ++i)
            if (poly[i] != 0) return i * bits_per_word + lsb(poly[i]);
        return npos;
    };

    // lambda: Returns the final set coefficient in poly or `npos` if the coefficients are all zero.
    auto final_set = [=](const auto& poly) {
        std::size_t i = N;
        while (i--)
            if (poly[i] != 0) return i * bits_per_word + msb(poly[i]);
        return npos;
    };

    // lambda: Returns true if the highest coefficient in `poly` is set (then poly is said to be monic).
    auto monic = [=](const auto& poly) -> bool {
        constexpr std::size_t complement = bits_per_word - 1;
        constexpr auto        final_bit_mask = static_cast<word_type>(one << complement);
        return (poly[N - 1] & final_bit_mask) != 0;
    };

    // lambda: Computes lhs <- lhs + rhs which in GF(2) is equivalent to  lhs <- lhs^rhs.
    auto add = [=](auto& lhs, const auto& rhs) {
        for (std::size_t i = 0; i < N; ++i) lhs[i] ^= rhs[i];
    };

    // lambda: Performs a one place shift on the polynomial coefficients stored in poly.
    // Shift is to the right if you think the elements are in vector order [p0,p1,p2,p3] -> [0,p0,p1,p2].
    // Shift is to the left when you think in bit order [b3,b2,b1,b0] -> [b2,b1,b0,0].
    auto shift = [=](auto& poly) {
        constexpr std::size_t complement = bits_per_word - 1;
        for (std::size_t i = N - 1; i > 0; --i) {
            // The top bit of the word below carries into the bottom bit of this word.
            auto l = static_cast<word_type>(poly[i] << 1);
            auto r = static_cast<word_type>(poly[i - 1] >> complement);
            poly[i] = static_cast<word_type>(l | r);
        }
        poly[0] <<= 1;
    };

    // lambda: If degree[poly] < n, this performs poly(x) <- x*poly(x) mod c(x) where c(x) = x^n + p(x).
    auto times_x_step = [&](auto& poly) {
        // If the x^{n-1} coefficient is set the shift produces an x^n term which we replace by p(x).
        bool add_p = monic(poly);
        shift(poly);
        if (add_p) add(poly, p);
    };

    // We precompute x^{n + i} mod c(x) for i = 0, ..., n-1 starting from the known x^n mod c(x) = p.
    // Each x^{n + i} mod c(x) is a word-vector of coefficients and we put the lot into a std::vector.
    std::vector<array_type> power_mod(n);
    power_mod[0] = p;
    for (std::size_t i = 1; i < n; ++i) {
        power_mod[i] = power_mod[i - 1];
        times_x_step(power_mod[i]);
    }

    // Some work space we use below (every word is overwritten by each riffle call).
    array_type hi{};

    // lambda: If degree[poly] < n, performs: poly(x) <- poly(x)^2 mod c(x) where as usual c(x) = x^n + p(x).
    auto square_step = [&](auto& poly) {
        // Compute poly(x)^2 -- in GF(2) this means interspersing all the coefficients with zeros.
        // We actually riffle poly directly into two arrays lo & hi so that poly(x)^2 = lo(x) + x^n hi(x).
        // This only works because n is a whole number of words (i.e. all bits in poly matter).
        // NOTE: Our riffle method above for arrays lets us reuse the poly array for lo.
        riffle(poly, poly, hi);

        // poly(x)^2 mod c(x) now is poly(x) + x^n hi(x) mod c(x) as degree[poly] < n.
        // Add the x^n hi(x) mod c(x) term-by-term noting that at most every second term in hi(x) is 1.
        auto hi_first = first_set(hi);
        if (hi_first != npos) {
            auto hi_final = final_set(hi);
            for (std::size_t i = hi_first; i <= hi_final; i += 2)
                if (test(hi, i)) add(poly, power_mod[i]);
        }
    };

    // Case: e = 2^J -- we just do J squaring steps starting from r(x) = x to get to  x^(2^J) mod c(x).
    if (J_is_log2) {
        set(result, 1);
        for (std::size_t j = 0; j < J; ++j) square_step(result);
        return result;
    }

    // Case e = J > n: We use a square & multiply algorithm:
    // Note that if e.g. J = 0b00010111 then std::bit_floor(J) = 0b00010000.
    std::size_t J_bit = std::bit_floor(J);

    // Start with r(x) = x mod c(x) which takes care of the most significant binary digit in J.
    set(result, 1);
    J_bit >>= 1;

    // And off we go ...
    while (J_bit) {
        // Always do a square step and then a times_x step if necessary (i.e. if current bit in J is set).
        square_step(result);
        if (J & J_bit) times_x_step(result);

        // On to the next bit position in J.
        J_bit >>= 1;
    }
    return result;
}


#ifdef GF2


// --------------------------------------------------------------------------------------------------------------------

// Non-member functions that are only defined if we have access to the `gf2` library.

// See https://nessan.github.io/gf2/ for tools for working with polynomials and matrices over GF(2).

// --------------------------------------------------------------------------------------------------------------------


template<typename State>

auto


transition_matrix() {


    using word_type = typename State::word_type;


    // Some constants for our state size.

    constexpr auto n_words = State::word_count();

    constexpr auto n_bits = State::bit_count();


    // The transition matrix will be a square n_bits x n_bits matrix over GF(2).

    gf2::BitMatrix<word_type> result{n_bits, n_bits};


    // Some work-space in word and bit space

    gf2::BitVector<word_type>      bits{n_bits};

    std::array<word_type, n_words> words;


    // Create an State instance we will use to step through unit states.

    State state;


    // We get the columns of the transition matrix by looking  at the action of `step()` on all the unit states.

    for (std::size_t k = 0; k < n_bits; ++k) {


        // Create the k'th unit state (i.e. the state just has the k'th bit set and all others are zero)

        bits.set_all(false);

        bits.set(k, true);


        // Translate that unit bit-vector into an array of words.

        bits.to_words(words.begin());


        // Seed the state from those words.

        state.seed(words.cbegin(), words.cend());


        // Advance the state by one step.

        state.step();


        // Translate the new state to bit-space.

        for (auto i = 0uz; i < n_words; ++i) bits.set_word(i, state[i]);


        // Store those bits into column `k` of the transition matrix.

        // NOTE:  Columnar access for a gf2::BitMatrix must be done element by element.

        for (auto i = 0uz; i < n_bits; ++i) result(i, k) = bits[i];

    }


    return result;

}


// Returns the characteristic polynomial for our state's transition matrix as a gf2::BitPolynomial.
// The transition matrix is rebuilt from scratch by `xso::transition_matrix<State>()` on every call.
template<typename State>
auto
characteristic_polynomial() {
    return xso::transition_matrix<State>().characteristic_polynomial();
}


// Returns a jump polynomial for the `State` type by forwarding to `c.reduce_x_to_the(N, N_is_log2)`.
//
// - `c`:         a polynomial over GF(2) with the state's word type -- presumably the characteristic polynomial
//                returned by `xso::characteristic_polynomial<State>()` (confirm against the callers).
// - `N`:         the jump size, or its base-2 logarithm if `N_is_log2` is true.
// - `N_is_log2`: passed straight through to the gf2 call; by analogy with `xso::reduce` this presumably selects
//                a jump of 2^N steps instead of N steps (see the gf2 documentation for `reduce_x_to_the`).
//
// NOTE: `State` only appears as `typename State::word_type`, which is a non-deduced context, so callers must name
// the template argument explicitly: `xso::jump_polynomial<State>(c, N)`.
template<typename State>

auto


jump_polynomial(gf2::BitPolynomial<typename State::word_type> const& c, std::size_t N, bool N_is_log2 = false) {

    return c.reduce_x_to_the(N, N_is_log2);

}


#endif


} // namespace xso


// --------------------------------------------------------------------------------------------------------------------

// Formatting and output stream support for our generators:

// --------------------------------------------------------------------------------------------------------------------


// A concept that matches any type that has an accessible `type_string()` class method (i.e. one that can be
// called as `T::type_string()` without an instance) whose result is convertible to a `std::string`.
// It constrains the `std::formatter` specialisation and the `operator<<` overload that follow.

template<typename T>

concept has_type_string_class_method = requires {

    { T::type_string() } -> std::convertible_to<std::string>;

};


// Formatter specialisation for any type with a `type_string()` class method -- lets such a type be used with
// `std::format` and friends, where it is rendered as whatever `T::type_string()` returns.
template<has_type_string_class_method T>
struct std::formatter<T> {

    // Parse the format specifier -- currently we only handle the default empty specifier `{}`.
    // Anything else is rejected with a `std::format_error`, the conventional way for a formatter to report a bad
    // specifier: it turns into a compile error when the format string is checked at compile time and into a
    // catchable exception for runtime format strings. Unlike an `assert` the check is still there under `NDEBUG`.
    constexpr auto parse(const std::format_parse_context& ctx) {
        auto it = ctx.begin();
        if (it != ctx.end() && *it != '}')
            throw std::format_error("xso: only the default empty format specifier is supported for this type");
        return it;
    }

    // Push out the formatted value -- the instance itself is ignored, only `T::type_string()` is written.
    // Returns the advanced output iterator as required of a formatter.
    template<class FormatContext>
    auto format(const T&, FormatContext& ctx) const {
        return std::format_to(ctx.out(), "{}", T::type_string());
    }
};


// The usual output stream operator for any type with a `type_string()` class method.
// The instance itself is ignored -- we just stream whatever `T::type_string()` returns and hand the stream back.
template<has_type_string_class_method T>
std::ostream&
operator<<(std::ostream& s, const T&) {
    return s << T::type_string();
}


xso::generator
A pseudorandom number generator combining a State and a Scrambler.
Definition xoshiro.h:69

xso::generator::type_string
static constexpr auto type_string()
Class method that returns a name for this type of generator — combining State and Scrambler names.
Definition xoshiro.h:114

xso::generator::max
static constexpr result_type max() noexcept
Returns the largest value this generator can produce.
Definition xoshiro.h:147

xso::generator::operator[]
constexpr word_type operator[](std::size_t i) const
Returns the i'th state word.
Definition xoshiro.h:313

xso::generator::jump
constexpr void jump(const array_type &jump_coefficients)
Efficiently jumps the generator's state forward by J steps where J can be huge (e....
Definition xoshiro.h:671

xso::generator::array_type
typename State::array_type array_type
A convenience container type to hold the full state of this generator, jump polynomial coefficients,...
Definition xoshiro.h:84

xso::generator::step
constexpr void step()
Advances the state by one step.
Definition xoshiro.h:294

xso::generator::min
static constexpr result_type min() noexcept
Returns the smallest value this generator can produce.
Definition xoshiro.h:136

xso::generator::state_type
State state_type
The State used by this generator type – one of the two state classes defined below.
Definition xoshiro.h:75

xso::generator::flip
constexpr bool flip(double p=0.5)
Sampling method that flips a coin, where the probability of getting true is p (defaults to 0....
Definition xoshiro.h:561

xso::generator::roll
constexpr std::size_t roll(std::size_t n_sides=6)
Sampling method that rolls a dice with an arbitrary number of sides (defaults to the usual 6).
Definition xoshiro.h:548

xso::generator::seed
constexpr void seed(Src b, Src e)
Seeds the generator from an iteration of unsigned words which are all copied into the state.
Definition xoshiro.h:285

xso::generator::sample
constexpr Dst sample(Src b, Src e, Dst dst, std::size_t n)
Sampling method that picks n elements without replacement from an iteration [b, e) and puts them in d...
Definition xoshiro.h:460

xso::generator::shuffle
constexpr void shuffle(Container &container)
This method shuffles all the elements of a container.
Definition xoshiro.h:600

xso::generator::generator
constexpr generator()
The default constructor seeds the full underlying state randomly.
Definition xoshiro.h:162

xso::generator::word_count
static constexpr std::size_t word_count()
Class method that returns the number of words of state for this type of generator.
Definition xoshiro.h:92

xso::generator::sample
constexpr Dst sample(Distribution auto &dist, Dst dst, std::size_t n)
Sampling method that takes n samples from a distribution and puts them into a destination iterator.
Definition xoshiro.h:530

xso::generator::seed
constexpr void seed(word_type seed)
Seeds the generator quickly but probably not well from a single unsigned integer value.
Definition xoshiro.h:254

xso::generator::sample
constexpr auto sample(const Src &src, Dst dst, std::size_t n)
Sampling method that picks n elements without replacement from a container and puts them in dst.
Definition xoshiro.h:490

xso::generator::bit_count
static constexpr std::size_t bit_count()
Class method that returns the number of bits of state for this type of generator.
Definition xoshiro.h:100

xso::generator::characteristic_coefficients
static constexpr auto characteristic_coefficients()
Class method that returns the state's precomputed characteristic polynomial coefficients packed into ...
Definition xoshiro.h:748

xso::generator::discard
void discard(std::uint64_t z)
Discards the next z iterations in the random number sequence.
Definition xoshiro.h:614

xso::generator::index
constexpr T index(T len)
Sampling method that returns a single index from a uniform distribution over [0, len-1].
Definition xoshiro.h:381

xso::generator::seed
constexpr void seed()
Seeds the full state to random starting values.
Definition xoshiro.h:216

xso::generator::generator
constexpr generator(word_type s)
Construct a generator quickly but not well from a single unsigned integer value.
Definition xoshiro.h:174

xso::generator::operator()
constexpr result_type operator()()
Returns the next random value from the generator which is a result_type unsigned integer.
Definition xoshiro.h:302

xso::generator::generator
constexpr generator(Iter b, Iter e)
Construct and seed from an iteration of unsigned words which are all copied into the state.
Definition xoshiro.h:195

xso::generator::word_type
typename State::word_type word_type
This generator type packs its state into words of this type (in practice, 32 or 64 bit unsigneds).
Definition xoshiro.h:81

xso::generator::jump
constexpr auto jump(std::size_t n, bool n_is_log2=false)
Jumps the generator's state forward by J steps where J is either n or 2^n to accommodate huge jumps t...
Definition xoshiro.h:642

xso::generator::scrambler_type
Scrambler scrambler_type
The Scrambler used by this generator type – one of the scrambler classes defined below.
Definition xoshiro.h:78

xso::generator::sample
constexpr T sample(T a, T b)
Sampling method that returns a single integer value from a uniform distribution over [a,...
Definition xoshiro.h:343

xso::generator::sample
constexpr auto sample(Distribution auto &dist)
Sampling method that returns a single random variate drawn from a distribution.
Definition xoshiro.h:508

xso::generator::characteristic_coefficients
static constexpr void characteristic_coefficients(Dst dst)
Class method that fills a destination iterator with the state's precomputed characteristic polynomial...
Definition xoshiro.h:728

xso::generator::get_state
constexpr void get_state(Dst dst) const
Copies the whole state into the destination iterator dst.
Definition xoshiro.h:320

xso::generator::shuffle
constexpr void shuffle(Iter b, Iter e)
This method shuffles the elements in an iteration.
Definition xoshiro.h:581

xso::generator::sample
constexpr auto sample(T b, T e)
Sampling method that returns a single value from an iteration – all elements are equally likely to be...
Definition xoshiro.h:402

xso::generator::sample
constexpr auto sample(const Container &container)
Sampling method that returns a single value from a container – all elements are equally likely to be ...
Definition xoshiro.h:433

xso::generator::result_type
word_type result_type
The unsigned integer type returned by the generator's operator()() method.
Definition xoshiro.h:125

xso::generator::jump
void jump(gf2::BitPolynomial< word_type > const &jump_poly)
Jumps a state/generator ahead in its random number stream by J steps.
Definition xoshiro.h:763

xso::partition::partition
partition(const RNG &rng, std::size_t n_partitions)
Constructs a partition for the passed parent random number generator rng.
Definition xoshiro.h:1243

xso::partition::next
RNG next()
Returns the next generator that is seeded at the start of the next sub-stream of the parent random nu...
Definition xoshiro.h:1266

xso::xoroshiro
The state for the Xoroshiro family of pseudorandom number generators.
Definition xoshiro.h:958

xso::xoroshiro::type_string
static constexpr auto type_string()
Class method that returns a name for this state.
Definition xoshiro.h:973

xso::xoroshiro::get_state
constexpr void get_state(Dst dst) const
Copies the whole state into the destination iterator dst.
Definition xoshiro.h:989

xso::xoroshiro::step
constexpr void step()
Advance the state by one step.
Definition xoshiro.h:1008

xso::xoroshiro::word_type
T word_type
The type of the words of state.
Definition xoshiro.h:961

xso::xoroshiro::operator[]
constexpr T operator[](std::size_t i) const
Returns the i'th state word.
Definition xoshiro.h:980

xso::xoroshiro::bit_count
static constexpr std::size_t bit_count()
Class method that returns the number of bits of state.
Definition xoshiro.h:970

xso::xoroshiro::characteristic_coefficients
static constexpr auto characteristic_coefficients()
Class method that returns the state's precomputed characteristic polynomial coefficients packed into ...
Definition xoshiro.h:1055

xso::xoroshiro::word_count
static constexpr std::size_t word_count()
Class method that returns the number of words in the underlying state.
Definition xoshiro.h:967

xso::xoroshiro::seed
constexpr void seed(Src b, Src e)
Sets the state from an iteration of words.
Definition xoshiro.h:1000

xso::xoroshiro::characteristic_coefficients
static constexpr void characteristic_coefficients(Dst dst)
Class method that fills a destination iterator with our precomputed characteristic polynomial coeffic...
Definition xoshiro.h:1025

xso::xoroshiro::array_type
std::array< T, N > array_type
A convenience container type to hold the full state of this generator, jump polynomial coefficients,...
Definition xoshiro.h:964

xso::xoshiro
The state for the Xoshiro family of pseudorandom number generators.
Definition xoshiro.h:829

xso::xoshiro::operator[]
constexpr T operator[](std::size_t i) const
Returns the i'th state word.
Definition xoshiro.h:849

xso::xoshiro::step
constexpr void step()
Advance the state by one step.
Definition xoshiro.h:877

xso::xoshiro::characteristic_coefficients
static constexpr auto characteristic_coefficients()
Class method that returns the state's precomputed characteristic polynomial coefficients packed into ...
Definition xoshiro.h:939

xso::xoshiro::word_count
static constexpr std::size_t word_count()
Class method that returns the number of words in the underlying state.
Definition xoshiro.h:838

xso::xoshiro::bit_count
static constexpr std::size_t bit_count()
Class method that returns the number of bits of state.
Definition xoshiro.h:841

xso::xoshiro::word_type
T word_type
The state is stored as an array of N words of type T.
Definition xoshiro.h:832

xso::xoshiro::characteristic_coefficients
static constexpr void characteristic_coefficients(Dst dst)
Class method that fills a destination iterator with our precomputed characteristic polynomial coeffic...
Definition xoshiro.h:913

xso::xoshiro::array_type
std::array< T, N > array_type
A convenience container type to hold the full state of this generator, jump polynomial coefficients,...
Definition xoshiro.h:835

xso::xoshiro::type_string
static constexpr auto type_string()
Class method that returns a name for this type of state.
Definition xoshiro.h:844

xso::xoshiro::get_state
constexpr void get_state(Dst dst) const
Copies the whole state into the destination iterator dst.
Definition xoshiro.h:856

xso::xoshiro::seed
constexpr void seed(Src b, Src e)
Sets the state from an iteration of words.
Definition xoshiro.h:867

xso::Distribution
A C++ concept that lets us distinguish standard distribution types from other types.
Definition xoshiro.h:46

std::formatter< T >::format
auto format(const T &, FormatContext &ctx) const
Push out a formatted xso::generator using its type_string() method.
Definition xoshiro.h:1681

std::formatter< T >::parse
constexpr auto parse(const std::format_parse_context &ctx)
Parse the format specifier – currently only handle the default empty specifier.
Definition xoshiro.h:1673

xso::plus_plus
The plus_plus scrambler is passed a state array and returns rotl(state[w0] + state[w1],...
Definition xoshiro.h:1162

xso::plus
The plus scrambler is passed a state array and returns state[w0] + state[w1].
Definition xoshiro.h:1150

xso::star_star
The star_star scrambler is passed a state array and returns T * rotl(S * state[w], R) where:
Definition xoshiro.h:1136

xso::star
The star scrambler is passed a state array and will return S * state[w] where:
Definition xoshiro.h:1119

xso::transition_matrix
auto transition_matrix()
Returns the transition matrix for a state/generator type as a gf2::BitMatrix.
Definition xoshiro.h:1583

xso::rng32
xoshiro_4x32_star_star rng32
The recommended 32-bit output generator – used as xso::rng32.
Definition xoshiro.h:1207

operator<<
std::ostream & operator<<(std::ostream &s, const T &)
The usual output stream operator for an xso::generator, State, or Scrambler.
Definition xoshiro.h:1691

xso::rng
rng64 rng
The recommended default generator for most usage – used as xso::rng.
Definition xoshiro.h:1213

xso::jump_coefficients
constexpr auto jump_coefficients(std::size_t J, bool J_is_log2=false)
Returns the coefficients of the jump polynomial that can be used to jump a generator/state ahead by  ...
Definition xoshiro.h:1303

xso::rng64
xoshiro_4x64_star_star rng64
The recommended 64-bit output generator – used as xso::rng64.
Definition xoshiro.h:1210

xso::characteristic_polynomial
auto characteristic_polynomial()
Returns the characteristic polynomial for our state's transition matrix as a gf2::BitPolynomial.
Definition xoshiro.h:1634

xso::jump_polynomial
auto jump_polynomial(gf2::BitPolynomial< typename State::word_type > const &c, std::size_t N, bool N_is_log2=false)
Returns a jump polynomial that moves the generator type J steps ahead in its random number stream.
Definition xoshiro.h:1648