// Copyright 2017-2019 Peter Dimov. // Distributed under the Boost Software License, Version 1.0. #define _CRT_SECURE_NO_WARNINGS #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include class mul31_32 { private: boost::uint32_t st_; public: typedef boost::uint32_t result_type; typedef boost::uint32_t size_type; mul31_32(): st_( 0x811C9DC5ul ) { } explicit mul31_32( boost::uint64_t seed ): st_( 0x811C9DC5ul ^ ( seed & 0xFFFFFFFFu ) ^ ( seed >> 32 ) ) { } void update( boost::hash2::byte_type const * p, std::ptrdiff_t n ) { boost::uint32_t h = st_; for( std::ptrdiff_t i = 0; i < n; ++i ) { h = h * 31 + static_cast( p[i] ); } st_ = h; } boost::uint32_t result() { boost::uint32_t r = st_; st_ = st_ * 31 + 0xFF; return r; } }; class mul31_64 { private: boost::uint64_t st_; public: typedef boost::uint64_t result_type; typedef boost::uint64_t size_type; mul31_64(): st_( 0xCBF29CE484222325ull ) { } explicit mul31_64( boost::uint64_t seed ): st_( 0xCBF29CE484222325ull ^ seed ) { } void update( boost::hash2::byte_type const * p, std::ptrdiff_t n ) { boost::uint64_t h = st_; for( std::ptrdiff_t i = 0; i < n; ++i ) { h = h * 31 + static_cast( p[i] ); } st_ = h; } boost::uint64_t result() { boost::uint64_t r = st_; st_ = st_ * 31 + 0xFF; return r; } }; template class hasher { private: std::size_t seed_; public: explicit hasher( std::size_t seed ): seed_( seed ) { } template std::size_t operator()( T const& v ) const { H h( seed_ ); using boost::hash2::hash_append; hash_append( h, v ); using boost::hash2::get_integral_result; return get_integral_result( h.result() ); } }; template void test4( int N, V const& v, char const * hash, char const* seed_text, S s ) { typedef boost::chrono::steady_clock clock_type; clock_type::time_point t1 = clock_type::now(); for( int i = 0; i < N; ++i ) { s.insert( v[ i * 16 ] ); } clock_type::time_point t2 = clock_type::now(); std::size_t q = 0; for( int i = 0; i < 16 * N; ++i ) { q += s.count( v[ i ] ); } clock_type::time_point t3 = clock_type::now(); long long ms1 = boost::chrono::duration_cast( t2 - t1 ).count(); long long ms2 = boost::chrono::duration_cast( t3 - t2 ).count(); std::size_t n = s.bucket_count(); std::size_t m = 0; for( std::size_t i = 0; i < n; ++i ) { std::size_t k = s.bucket_size( i ); if( k > m ) { m = k; } } #if defined( _MSC_VER ) std::printf( "%s(%s): n=%Iu, m=%Iu, q=%Iu, %lld + %lld ms\n", hash, seed_text, n, m, q, ms1, ms2 ); #else std::printf( "%s(%s): n=%zu, m=%zu, q=%zu, %lld + %lld ms\n", hash, seed_text, n, m, q, ms1, ms2 ); #endif } template void test3( int N, V const& v, char const* seed_text, std::size_t seed ) { boost::unordered_set< K, hasher > s( 0, hasher( seed ) ); test4( N, v, boost::core::demangle( typeid(H).name() ).c_str(), seed_text, s ); } template void test2( int N, V const& v ) { test3( N, v, "0", 0 ); test3( N, v, "1", 1 ); test3( N, v, "~0", ~static_cast( 0 ) ); std::puts( "" ); } int main() { int const N = 1048576; std::vector v; { v.reserve( N * 16 ); boost::mt19937_64 rnd; for( int i = 0; i < 16 * N; ++i ) { unsigned long long k = rnd(); char buffer[ 64 ]; sprintf( buffer, "prefix_%llu_suffix", k ); v.push_back( buffer ); } } typedef std::string K; { boost::unordered_set s; test4( N, v, "default", "0", s ); std::puts( "" ); } test2( N, v ); test2( N, v ); test2( N, v ); test2( N, v ); test2( N, v ); test2( N, v ); test2( N, v ); test2( N, v ); test2( N, v ); test2( N, v ); test2( N, v ); test2( N, v ); test2( N, v ); std::puts( "" ); }