2
0
mirror of https://github.com/boostorg/compute.git synced 2026-01-26 18:32:48 +00:00
Files
compute/perf/perf_copy_to_device.cpp
Kyle Lutz 3bc5bfaf78 Remove timer class
This removes the timer class. The technique of measuring the time
difference between two different OpenCL markers on a command queue
is not portable to all OpenCL implementations (only works on NVIDIA).

A new internal timer class has been added which uses boost::chrono
(or std::chrono if BOOST_COMPUTE_TIMER_USE_STD_CHRONO is defined).
This new timer is used by the benchmarks to measure time elapsed
on the host.
2013-05-20 21:08:42 -04:00

63 lines
2.0 KiB
C++

//---------------------------------------------------------------------------//
// Copyright (c) 2013 Kyle Lutz <kyle.r.lutz@gmail.com>
//
// Distributed under the Boost Software License, Version 1.0
// See accompanying file LICENSE_1_0.txt or copy at
// http://www.boost.org/LICENSE_1_0.txt
//
// See http://kylelutz.github.com/compute for more information.
//---------------------------------------------------------------------------//
#include <algorithm>
#include <cstdlib>
#include <iostream>
#include <vector>

#include <boost/lexical_cast.hpp>

#include <boost/compute.hpp>
int main(int argc, char *argv[])
{
size_t size = 1000;
if(argc >= 2){
size = boost::lexical_cast<size_t>(argv[1]);
}
boost::compute::device device = boost::compute::system::default_device();
boost::compute::context context(device);
boost::compute::command_queue::properties
properties = boost::compute::command_queue::enable_profiling;
boost::compute::command_queue queue(context, device, properties);
std::vector<int> host_vector(size);
std::generate(host_vector.begin(), host_vector.end(), rand);
boost::compute::vector<int> device_vector(host_vector.size(), context);
boost::compute::future<void> future =
boost::compute::copy_async(host_vector.begin(),
host_vector.end(),
device_vector.begin(),
queue);
// wait for copy to finish
future.wait();
using boost::compute::ulong_;
ulong_ start_time =
future.get_event().get_profiling_info<ulong_>(
boost::compute::event::profiling_command_start
);
ulong_ end_time =
future.get_event().get_profiling_info<ulong_>(
boost::compute::event::profiling_command_end
);
size_t elapsed = end_time - start_time;
std::cout << "time: " << elapsed / 1e6 << " ms" << std::endl;
float rate = (float(size * sizeof(int)) / elapsed) * 1000.f;
std::cout << "rate: " << rate << " MB/s" << std::endl;
return 0;
}