/* boost random_speed.cpp performance measurements * * Copyright Jens Maurer 2000 * Permission to use, copy, modify, sell, and distribute this software * is hereby granted without fee provided that the above copyright notice * appears in all copies and that both that copyright notice and this * permission notice appear in supporting documentation, * * Jens Maurer makes no representations about the suitability of this * software for any purpose. It is provided "as is" without express or * implied warranty. * * $Id$ */ #include #include #include #include #include #include /* * Configuration Section */ // define if your C library supports the non-standard drand48 family #undef HAVE_DRAND48 // define if you have the original mt19937int.c (with commented out main()) #undef HAVE_MT19937INT_C // set to your CPU frequency in MHz static const double cpu_frequency = 200 * 1e6; /* * End of Configuration Section */ /* * General portability note: * MSVC mis-compiles explicit function template instantiations. * For example, f() and f() are both compiled to call f(). * BCC is unable to implicitly convert a "const char *" to a std::string * when using explicit function template instantiations. * * Therefore, avoid explicit function template instantiations. */ // provides a run-time configurable linear congruential generator, just // for comparison template class linear_congruential { public: typedef IntType result_type; BOOST_STATIC_CONSTANT(bool, has_fixed_range = false); linear_congruential(IntType x0, IntType a, IntType c, IntType m) : _x(x0), _a(a), _c(c), _m(m) { } // compiler-generated copy ctor and assignment operator are fine void seed(IntType x0, IntType a, IntType c, IntType m) { _x = x0; _a = a; _c = c; _m = m; } void seed(IntType x0) { _x = x0; } result_type operator()() { _x = (_a*_x+_c) % _m; return _x; } result_type min() const { return _c == 0 ? 1 : 0; } result_type max() const { return _m -1; } private: IntType _x, _a, _c, _m; }; // simplest "random" number generator possible, to check on overhead class counting { public: typedef int result_type; BOOST_STATIC_CONSTANT(bool, has_fixed_range = false); counting() : _x(0) { } result_type operator()() { return ++_x; } result_type min() const { return 1; } result_type max() const { return std::numeric_limits::max(); } private: int _x; }; // make distributions (and underlying engines) runtime-exchangeable, // for speed comparison template class DistributionBase { public: virtual void reset() = 0; virtual Ret operator()() = 0; virtual ~DistributionBase() { } }; template class Distribution : public DistributionBase { public: Distribution(const Dist& d) : _d(d) { } void reset() { _d.reset(); } Ret operator()() { return _d(); } private: Dist _d; }; template class GenericDistribution { public: typedef Ret result_type; GenericDistribution() { }; void set(boost::shared_ptr > p) { _p = p; } // takes over ownership void set(DistributionBase * p) { _p.reset(p); } Ret operator()() { return (*_p)(); } private: boost::shared_ptr > _p; }; // start implementation of measuring timing void show_elapsed(double end, int iter, const std::string & name) { double usec = end/iter*1e6; double cycles = usec * cpu_frequency/1e6; std::cout << name << ": " << usec*1e3 << " nsec/loop = " << cycles << " CPU cycles" << std::endl; } template void timing(RNG & rng, int iter, const std::string& name) { // make sure we're not optimizing too much volatile typename RNG::result_type tmp; boost::timer t; for(int i = 0; i < iter; i++) tmp = rng(); show_elapsed(t.elapsed(), iter, name); } template void timing_sphere(RNG & rng, int iter, const std::string & name) { boost::timer t; for(int i = 0; i < iter; i++) { // the special return value convention of uniform_on_sphere saves 20% CPU const std::vector & tmp = rng(); (void) tmp[0]; } show_elapsed(t.elapsed(), iter, name); } template void run(int iter, const std::string & name, const RNG &) { RNG rng; std::cout << (RNG::has_fixed_range ? "fixed-range " : ""); // BCC has trouble with string autoconversion for explicit specializations timing(rng, iter, std::string(name)); } #ifdef HAVE_DRAND48 // requires non-standard C library support for srand48/lrand48 void run(int iter, const std::string & name, int) { std::srand48(1); timing(std::lrand48, iter, name); } #endif #ifdef HAVE_MT19937INT_C // requires the original mt19937int.c extern "C" void sgenrand(unsigned long); extern "C" unsigned long genrand(); void run(int iter, const std::string & name, float) { sgenrand(4357); timing(genrand, iter, name, 0u); } #endif template void distrib(int iter, const std::string & name, const Gen &) { Gen gen; boost::uniform_smallint usmallint(gen, -2, 4); timing(usmallint, iter, name + " uniform_smallint"); boost::uniform_int uint(gen, -2, 4); timing(uint, iter, name + " uniform_int"); boost::geometric_distribution geo(gen, 0.5); timing(geo, iter, name + " geometric"); boost::uniform_01 uni(gen); timing(uni, iter, name + " uniform_01"); boost::uniform_real ur(gen, -5.3, 4.8); timing(ur, iter, name + " uniform_real"); boost::triangle_distribution tria(gen, 1, 2, 7); timing(tria, iter, name + " triangle"); boost::exponential_distribution ex(gen, 3); timing(ex, iter, name + " exponential"); boost::normal_distribution no2(gen); timing(no2, iter, name + " normal polar"); boost::lognormal_distribution lnorm(gen, 1, 1); timing(lnorm, iter, name + " lognormal"); boost::cauchy_distribution cauchy(gen); timing(cauchy, iter, name + " cauchy"); boost::gamma_distribution gamma(gen, 0.4); timing(gamma, iter, name + " gamma"); boost::uniform_on_sphere usph(gen, 3); timing_sphere(usph, iter/10, name + " uniform_on_sphere"); } template void distrib_runtime(int iter, const std::string & n, const Gen &) { std::string name = n + " virtual function "; Gen gen; GenericDistribution g_int; boost::uniform_smallint usmallint(gen, -2, 4); g_int.set(new Distribution >(usmallint)); timing(g_int, iter, name + "uniform_smallint"); boost::uniform_int uint(gen, -2, 4); g_int.set(new Distribution >(uint)); timing(g_int, iter, name + "uniform_int"); boost::geometric_distribution geo(gen, 0.5); g_int.set(new Distribution >(geo)); timing(g_int, iter, name + "geometric"); GenericDistribution g; boost::uniform_01 uni(gen); g.set(new Distribution >(uni)); timing(g, iter, name + "uniform_01"); boost::uniform_real ur(gen, -5.3, 4.8); g.set(new Distribution >(ur)); timing(g, iter, name + "uniform_real"); boost::triangle_distribution tria(gen, 1, 2, 7); g.set(new Distribution >(tria)); timing(g, iter, name + "triangle"); boost::exponential_distribution ex(gen, 3); g.set(new Distribution >(ex)); timing(g, iter, name + "exponential"); boost::normal_distribution no2(gen); g.set(new Distribution >(no2)); timing(g, iter, name + "normal polar"); boost::lognormal_distribution lnorm(gen, 1, 1); g.set(new Distribution >(lnorm)); timing(g, iter, name + "lognormal"); boost::cauchy_distribution cauchy(gen); g.set(new Distribution >(cauchy)); timing(g, iter, name + "cauchy"); boost::gamma_distribution gamma(gen, 0.4); g.set(new Distribution >(gamma)); timing(g, iter, name + "gamma"); } int main(int argc, char*argv[]) { if(argc != 2) { std::cerr << "usage: " << argv[0] << " iterations" << std::endl; return 1; } // okay, it's ugly, but it's only used here int iter = #ifndef BOOST_NO_STDC_NAMESPACE std:: #endif atoi(argv[1]); #if !defined(BOOST_NO_INT64_T) && \ !defined(BOOST_NO_INCLASS_MEMBER_INITIALIZATION) run(iter, "rand48", boost::rand48()); linear_congruential lcg48(boost::uint64_t(1)<<16 | 0x330e, boost::uint64_t(0xDEECE66DUL) | (boost::uint64_t(0x5) << 32), 0xB, boost::uint64_t(1)<<48); timing(lcg48, iter, "lrand48 run-time"); #endif #ifdef HAVE_DRAND48 // requires non-standard C library support for srand48/lrand48 run(iter, "lrand48", 0); // coded for lrand48() #endif run(iter, "minstd_rand", boost::minstd_rand()); run(iter, "ecuyer combined", boost::ecuyer1988()); run(iter, "kreutzer1986", boost::kreutzer1986()); run(iter, "hellekalek1995 (inversive)", boost::hellekalek1995()); run(iter, "mt11213b", boost::mt11213b()); run(iter, "mt19937", boost::mt19937()); run(iter, "subtract_with_carry", boost::random::ranlux_base()); run(iter, "subtract_with_carry_01", boost::random::ranlux_base_01()); run(iter, "ranlux3", boost::ranlux3()); run(iter, "ranlux4", boost::ranlux4()); run(iter, "ranlux3_01", boost::ranlux3_01()); run(iter, "ranlux4_01", boost::ranlux4_01()); run(iter, "counting", counting()); #ifdef HAVE_MT19937INT_C // requires the original mt19937int.c run(iter, "mt19937 original"); // coded for sgenrand()/genrand() #endif distrib(iter, "counting", counting()); distrib_runtime(iter, "counting", counting()); distrib(iter, "minstd_rand", boost::minstd_rand()); distrib(iter, "kreutzer1986", boost::kreutzer1986()); distrib(iter, "mt19937", boost::mt19937()); distrib_runtime(iter, "mt19937", boost::mt19937()); }