2
0
mirror of https://github.com/boostorg/compute.git synced 2026-01-28 07:02:15 +00:00
Files
compute/perf/perf_copy_to_device.cpp
Kyle Lutz ec11d8cdc4 Add third-party perf tests
This adds third-party performance tests to use in comparing
Boost.Compute with other parallel/GPGPU frameworks like Intel's
TBB and NVIDIA's Thrust along with the C++ STL.

Also refactors the timing and profiling infrastructure and adds
a simple perf.py driver script for running performance tests.
2014-02-02 13:12:17 -08:00

63 lines
2.0 KiB
C++

//---------------------------------------------------------------------------//
// Copyright (c) 2013-2014 Kyle Lutz <kyle.r.lutz@gmail.com>
//
// Distributed under the Boost Software License, Version 1.0
// See accompanying file LICENSE_1_0.txt or copy at
// http://www.boost.org/LICENSE_1_0.txt
//
// See http://kylelutz.github.com/compute for more information.
//---------------------------------------------------------------------------//
#include <algorithm>
#include <cstdlib>
#include <iostream>
#include <vector>

#include <boost/compute.hpp>
#include <boost/lexical_cast.hpp>
int main(int argc, char *argv[])
{
size_t size = 1000;
if(argc >= 2){
size = boost::lexical_cast<size_t>(argv[1]);
}
boost::compute::device device = boost::compute::system::default_device();
boost::compute::context context(device);
boost::compute::command_queue::properties
properties = boost::compute::command_queue::enable_profiling;
boost::compute::command_queue queue(context, device, properties);
std::vector<int> host_vector(size);
std::generate(host_vector.begin(), host_vector.end(), rand);
boost::compute::vector<int> device_vector(host_vector.size(), context);
boost::compute::future<void> future =
boost::compute::copy_async(host_vector.begin(),
host_vector.end(),
device_vector.begin(),
queue);
// wait for copy to finish
future.wait();
using boost::compute::ulong_;
ulong_ start_time =
future.get_event().get_profiling_info<ulong_>(
boost::compute::event::profiling_command_start
);
ulong_ end_time =
future.get_event().get_profiling_info<ulong_>(
boost::compute::event::profiling_command_end
);
size_t elapsed = end_time - start_time;
std::cout << "time: " << elapsed / 1e6 << " ms" << std::endl;
float rate = (float(size * sizeof(int)) / elapsed) * 1000.f;
std::cout << "rate: " << rate << " MB/s" << std::endl;
return 0;
}