194 lines
6.2 KiB
Plaintext
194 lines
6.2 KiB
Plaintext
|
//---------------------------------------------------------------------------//
|
||
|
// Copyright (c) 2013 Kyle Lutz <kyle.r.lutz@gmail.com>
|
||
|
//
|
||
|
// Distributed under the Boost Software License, Version 1.0
|
||
|
// See accompanying file LICENSE_1_0.txt or copy at
|
||
|
// http://www.boost.org/LICENSE_1_0.txt
|
||
|
//
|
||
|
// See http://boostorg.github.com/compute for more information.
|
||
|
//---------------------------------------------------------------------------//
|
||
|
|
||
|
#ifndef BOOST_COMPUTE_ALGORITHM_DETAIL_COPY_TO_DEVICE_HPP
|
||
|
#define BOOST_COMPUTE_ALGORITHM_DETAIL_COPY_TO_DEVICE_HPP
|
||
|
|
||
|
#include <iterator>
|
||
|
|
||
|
#include <boost/utility/addressof.hpp>
|
||
|
|
||
|
#include <boost/compute/command_queue.hpp>
|
||
|
#include <boost/compute/async/future.hpp>
|
||
|
#include <boost/compute/iterator/buffer_iterator.hpp>
|
||
|
#include <boost/compute/memory/svm_ptr.hpp>
|
||
|
|
||
|
namespace boost {
|
||
|
namespace compute {
|
||
|
namespace detail {
|
||
|
|
||
|
template<class HostIterator, class DeviceIterator>
|
||
|
inline DeviceIterator copy_to_device(HostIterator first,
|
||
|
HostIterator last,
|
||
|
DeviceIterator result,
|
||
|
command_queue &queue)
|
||
|
{
|
||
|
typedef typename
|
||
|
std::iterator_traits<DeviceIterator>::value_type
|
||
|
value_type;
|
||
|
typedef typename
|
||
|
std::iterator_traits<DeviceIterator>::difference_type
|
||
|
difference_type;
|
||
|
|
||
|
size_t count = iterator_range_size(first, last);
|
||
|
if(count == 0){
|
||
|
return result;
|
||
|
}
|
||
|
|
||
|
size_t offset = result.get_index();
|
||
|
|
||
|
queue.enqueue_write_buffer(result.get_buffer(),
|
||
|
offset * sizeof(value_type),
|
||
|
count * sizeof(value_type),
|
||
|
::boost::addressof(*first));
|
||
|
|
||
|
return result + static_cast<difference_type>(count);
|
||
|
}
|
||
|
|
||
|
template<class HostIterator, class DeviceIterator>
|
||
|
inline DeviceIterator copy_to_device_map(HostIterator first,
|
||
|
HostIterator last,
|
||
|
DeviceIterator result,
|
||
|
command_queue &queue)
|
||
|
{
|
||
|
typedef typename
|
||
|
std::iterator_traits<DeviceIterator>::value_type
|
||
|
value_type;
|
||
|
typedef typename
|
||
|
std::iterator_traits<DeviceIterator>::difference_type
|
||
|
difference_type;
|
||
|
|
||
|
size_t count = iterator_range_size(first, last);
|
||
|
if(count == 0){
|
||
|
return result;
|
||
|
}
|
||
|
|
||
|
size_t offset = result.get_index();
|
||
|
|
||
|
// map result buffer to host
|
||
|
value_type *pointer = static_cast<value_type*>(
|
||
|
queue.enqueue_map_buffer(
|
||
|
result.get_buffer(),
|
||
|
CL_MAP_WRITE,
|
||
|
offset * sizeof(value_type),
|
||
|
count * sizeof(value_type)
|
||
|
)
|
||
|
);
|
||
|
|
||
|
// copy [first; last) to result buffer
|
||
|
std::copy(first, last, pointer);
|
||
|
|
||
|
// unmap result buffer
|
||
|
boost::compute::event unmap_event = queue.enqueue_unmap_buffer(
|
||
|
result.get_buffer(),
|
||
|
static_cast<void*>(pointer)
|
||
|
);
|
||
|
unmap_event.wait();
|
||
|
|
||
|
return result + static_cast<difference_type>(count);
|
||
|
}
|
||
|
|
||
|
template<class HostIterator, class DeviceIterator>
|
||
|
inline future<DeviceIterator> copy_to_device_async(HostIterator first,
|
||
|
HostIterator last,
|
||
|
DeviceIterator result,
|
||
|
command_queue &queue)
|
||
|
{
|
||
|
typedef typename
|
||
|
std::iterator_traits<DeviceIterator>::value_type
|
||
|
value_type;
|
||
|
typedef typename
|
||
|
std::iterator_traits<DeviceIterator>::difference_type
|
||
|
difference_type;
|
||
|
|
||
|
size_t count = iterator_range_size(first, last);
|
||
|
if(count == 0){
|
||
|
return future<DeviceIterator>();
|
||
|
}
|
||
|
|
||
|
size_t offset = result.get_index();
|
||
|
|
||
|
event event_ =
|
||
|
queue.enqueue_write_buffer_async(result.get_buffer(),
|
||
|
offset * sizeof(value_type),
|
||
|
count * sizeof(value_type),
|
||
|
::boost::addressof(*first));
|
||
|
|
||
|
return make_future(result + static_cast<difference_type>(count), event_);
|
||
|
}
|
||
|
|
||
|
#ifdef CL_VERSION_2_0
|
||
|
// copy_to_device() specialization for svm_ptr
|
||
|
template<class HostIterator, class T>
|
||
|
inline svm_ptr<T> copy_to_device(HostIterator first,
|
||
|
HostIterator last,
|
||
|
svm_ptr<T> result,
|
||
|
command_queue &queue)
|
||
|
{
|
||
|
size_t count = iterator_range_size(first, last);
|
||
|
if(count == 0){
|
||
|
return result;
|
||
|
}
|
||
|
|
||
|
queue.enqueue_svm_memcpy(
|
||
|
result.get(), ::boost::addressof(*first), count * sizeof(T)
|
||
|
);
|
||
|
|
||
|
return result + count;
|
||
|
}
|
||
|
|
||
|
template<class HostIterator, class T>
|
||
|
inline future<svm_ptr<T> > copy_to_device_async(HostIterator first,
|
||
|
HostIterator last,
|
||
|
svm_ptr<T> result,
|
||
|
command_queue &queue)
|
||
|
{
|
||
|
size_t count = iterator_range_size(first, last);
|
||
|
if(count == 0){
|
||
|
return future<svm_ptr<T> >();
|
||
|
}
|
||
|
|
||
|
event event_ = queue.enqueue_svm_memcpy_async(
|
||
|
result.get(), ::boost::addressof(*first), count * sizeof(T)
|
||
|
);
|
||
|
|
||
|
return make_future(result + count, event_);
|
||
|
}
|
||
|
|
||
|
template<class HostIterator, class T>
|
||
|
inline svm_ptr<T> copy_to_device_map(HostIterator first,
|
||
|
HostIterator last,
|
||
|
svm_ptr<T> result,
|
||
|
command_queue &queue)
|
||
|
{
|
||
|
size_t count = iterator_range_size(first, last);
|
||
|
if(count == 0){
|
||
|
return result;
|
||
|
}
|
||
|
|
||
|
// map
|
||
|
queue.enqueue_svm_map(result.get(), count * sizeof(T), CL_MAP_WRITE);
|
||
|
|
||
|
// copy [first; last) to result buffer
|
||
|
std::copy(first, last, static_cast<T*>(result.get()));
|
||
|
|
||
|
// unmap result
|
||
|
queue.enqueue_svm_unmap(result.get()).wait();
|
||
|
|
||
|
return result + count;
|
||
|
}
|
||
|
#endif // CL_VERSION_2_0
|
||
|
|
||
|
} // end detail namespace
|
||
|
} // end compute namespace
|
||
|
} // end boost namespace
|
||
|
|
||
|
#endif // BOOST_COMPUTE_ALGORITHM_DETAIL_COPY_TO_DEVICE_HPP
|