Распределения и внутреннее состояние

На Stack Overflow есть много вопросов о генерации равномерно распределённых целых чисел из заранее неизвестных диапазонов. Например.

Типичное решение - это что-то вроде:

// Gives access to the calling thread's Mersenne Twister engine.
// The engine is default-constructed (no seed is supplied here) and, being
// thread_local, every thread owns a separate instance that persists
// between calls.
inline std::mt19937 &engine()
{
  static thread_local std::mt19937 generator{};
  return generator;
}

// Draws one integer from the closed range [from, to].
// A brand-new distribution object is built on every call; the random bits
// come from the engine returned by engine().
int get_int_from_range(int from, int to)
{
  using uniform_t = std::uniform_int_distribution<int>;

  auto &rng = engine();
  return uniform_t{from, to}(rng);
}

Учитывая, что распределение задумано как легковесный объект и его многократное воссоздание не вызывает проблем с производительностью, кажется, что даже простое распределение вполне может иметь (и обычно имеет) некоторое внутреннее состояние.

Поэтому мне интересно: если вмешиваться в работу распределения, постоянно сбрасывая его (т.е. воссоздавая распределение при каждом вызове get_int_from_range), получу ли я правильно распределённые результаты?

Есть длительное обсуждение между Питом Беккером и Стивом Джессопом, но без окончательного вывода. В другом вопросе (Должен ли я хранить экземпляр объекта случайного распределения или я могу его воссоздать?) "проблема" внутреннего состояния не кажется очень важной.

Предоставляет ли стандарт С++ какие-либо гарантии в отношении этой темы?

Является ли следующая реализация (из N4316 — std::rand replacement) несколько более надёжной?

// Draws one integer using the bounds [from, to] supplied for this call only.
// A single default-constructed distribution is kept per thread and reused;
// the bounds are passed through param_type instead of being stored in it.
int get_int_from_range(int from, int to)
{
  using dist_t = std::uniform_int_distribution<int>;

  thread_local dist_t shared_dist;

  const dist_t::param_type bounds(from, to);
  return shared_dist(engine(), bounds);
}

ПРАВКА

Этот вариант повторно использует возможное внутреннее состояние распределения, но он сложен, и я не уверен, что он стоит затраченных усилий:

// Draws one integer from [from, to], keeping one distribution object per
// distinct (from, to) pair in a thread-local map so that the same object is
// reused whenever the same range is requested again on this thread.
int get_int_from_range(int from, int to)
{
  using bounds_t = std::pair<int, int>;
  using dist_t = std::uniform_int_distribution<int>;

  thread_local std::map<bounds_t, dist_t> cache;

  const bounds_t key(from, to);
  auto pos = cache.find(key);
  if (pos == cache.end())
  {
    // First request for this range on this thread: create its distribution.
    pos = cache.emplace(key, dist_t{from, to}).first;
  }

  return pos->second(engine());
}

(из qaru.site/info/294471/...)

#include <chrono>
#include <cstddef>
#include <memory>
#include <random>
#include <utility>

using engine_type = std::mt19937_64;

// Produces a seed from the current system_clock reading (the tick count
// since the clock's epoch).
inline std::size_t get_seed()
{
  return static_cast<std::size_t>(
      std::chrono::system_clock::now().time_since_epoch().count());
}

// Returns the shared engine. It is created and seeded with get_seed() the
// first time this function is called and the same object is returned on
// every later call.
engine_type& engine_singleton()
{
  // A function-local static replaces the hand-rolled unique_ptr + new lazy
  // initialisation: same "create on first use" behaviour, no heap allocation.
  static engine_type instance(get_seed());
  return instance;
}

// ------------------------------------------------------------------------

#include <algorithm>
#include <cmath>
#include <cstdio>
#include <string>
#include <vector>

// Prints a text histogram: one line per entry of D, formatted as
// "<index>: <stars>", where the number of stars is D[i] * mass truncated
// towards zero.
//
// D    - values to plot (one bar per element).
// mass - scale factor applied to each value before truncation.
void plot_distribution(const std::vector<double>& D, std::size_t mass = 200)
{
  for (std::size_t i = 0; i < D.size(); ++i)
  {
    const double scaled = D[i] * mass;
    // Negative or NaN values draw an empty bar; converting them to an
    // unsigned count would be undefined behaviour.
    const std::size_t stars =
        scaled > 0.0 ? static_cast<std::size_t>(scaled) : 0;
    // %zu is the conversion specifier that matches std::size_t.
    std::printf("%02zu: %s\n", i, std::string(stars, '*').c_str());
  }
}

// Returns the largest absolute element-wise difference between x and y
// (0.0 when there is nothing to compare). If the vectors differ in length,
// only the common prefix is compared so that neither is read out of bounds.
double maximum_difference(const std::vector<double>& x,
                          const std::vector<double>& y)
{
  const std::size_t n = std::min(x.size(), y.size());
  double largest = 0.0;
  for (std::size_t i = 0; i < n; ++i)
    largest = std::max(largest, std::abs(x[i] - y[i]));
  return largest;
}

#include <iostream> #include <vector> #include <cstdio> #include <random> #include <string> #include <cmath> void compare_uniform_distributions( int lo, int hi ) { const size_t sample_size = 1e5; // Initialize histograms std::vector<double> H1( hi-lo+1, 0.0 ), H2( hi-lo+1, 0.0 ); // Initialize distribution auto U = std::uniform_int_distribution<int>(lo,hi); // Count! for ( size_t i = 0; i < sample_size; ++i ) { engine_type E(get_seed()); H1[ U(engine_singleton())-lo ] += 1.0; H2[ U(E)-lo ] += 1.0; } // Normalize histograms to obtain "densities" for ( size_t i = 0; i < H1.size(); ++i ) { H1[i] /= sample_size; H2[i] /= sample_size; } printf("Engine singleton:\n"); plot_distribution(H1); printf("Engine creation :\n"); plot_distribution(H2); printf("Maximum difference: %.3f\n", maximum_difference(H1,H2) ); std::cout<< std::string(50,'-') << std::endl << std::endl; } void compare_poisson_distributions( double mean ) { const size_t sample_size = 1e5; const size_t nbins = static_cast<size_t>(std::ceil(2*mean)); // Initialize histograms std::vector<double> H1( nbins, 0.0 ), H2( nbins, 0.0 ); // Initialize distribution auto U = std::poisson_distribution<int>(mean); // Count! for ( size_t i = 0; i < sample_size; ++i ) { engine_type E(get_seed()); int u1 = U(engine_singleton()); int u2 = U(E); if (u1 < nbins) H1[u1] += 1.0; if (u2 < nbins) H2[u2] += 1.0; } // Normalize histograms to obtain "densities" for ( size_t i = 0; i < H1.size(); ++i ) { H1[i] /= sample_size; H2[i] /= sample_size; } printf("Engine singleton:\n"); plot_distribution(H1); printf("Engine creation :\n"); plot_distribution(H2); printf("Maximum difference: %.3f\n", maximum_difference(H1,H2) ); std::cout<< std::string(50,'-') << std::endl << std::endl; } // ------------------------------------------------------------------------ int main() { compare_uniform_distributions( 0, 25 ); compare_poisson_distributions( 12 ); }

#include <chrono>
#include <cstddef>
#include <functional>
#include <random>
#include <utility>

// Produces a seed from the current system_clock reading (the tick count
// since the clock's epoch).
inline std::size_t get_seed()
{
  return static_cast<std::size_t>(
      std::chrono::system_clock::now().time_since_epoch().count());
}

// A nullary callable that yields one value of Distrib's result type per call.
template <class Distrib>
using generator_type = std::function<typename Distrib::result_type()>;

// Builds a self-contained generator: a Distrib constructed from args together
// with its own Engine seeded from get_seed(). Both are stored inside the
// returned callable, so each generator carries independent state.
//
// Distrib - distribution type; args are forwarded to its constructor.
// Engine  - random engine type constructible from a seed value.
template <class Distrib, class Engine = std::mt19937_64, class... Args>
inline generator_type<Distrib> get_generator(Args&&... args)
{
  Distrib distribution(std::forward<Args>(args)...);
  Engine engine(get_seed());
  // mutable: drawing a value advances the captured engine (and may update
  // the captured distribution).
  return [distribution, engine]() mutable { return distribution(engine); };
}

// ------------------------------------------------------------------------

#include <iostream>

int main()
{
  auto U = get_generator<std::uniform_int_distribution<int>>(0, 10);
  std::cout << U() << '\n';
}

Ответ 1