//---------------------------------------------------------------------------// // Copyright (c) 2013 Kyle Lutz // // Distributed under the Boost Software License, Version 1.0 // See accompanying file LICENSE_1_0.txt or copy at // http://www.boost.org/LICENSE_1_0.txt // // See http://boostorg.github.com/compute for more information. //---------------------------------------------------------------------------// #ifndef BOOST_COMPUTE_ALGORITHM_DETAIL_COPY_TO_DEVICE_HPP #define BOOST_COMPUTE_ALGORITHM_DETAIL_COPY_TO_DEVICE_HPP #include #include #include #include #include #include namespace boost { namespace compute { namespace detail { template inline DeviceIterator copy_to_device(HostIterator first, HostIterator last, DeviceIterator result, command_queue &queue) { typedef typename std::iterator_traits::value_type value_type; typedef typename std::iterator_traits::difference_type difference_type; size_t count = iterator_range_size(first, last); if(count == 0){ return result; } size_t offset = result.get_index(); queue.enqueue_write_buffer(result.get_buffer(), offset * sizeof(value_type), count * sizeof(value_type), ::boost::addressof(*first)); return result + static_cast(count); } template inline DeviceIterator copy_to_device_map(HostIterator first, HostIterator last, DeviceIterator result, command_queue &queue) { typedef typename std::iterator_traits::value_type value_type; typedef typename std::iterator_traits::difference_type difference_type; size_t count = iterator_range_size(first, last); if(count == 0){ return result; } size_t offset = result.get_index(); // map result buffer to host value_type *pointer = static_cast( queue.enqueue_map_buffer( result.get_buffer(), CL_MAP_WRITE, offset * sizeof(value_type), count * sizeof(value_type) ) ); // copy [first; last) to result buffer std::copy(first, last, pointer); // unmap result buffer boost::compute::event unmap_event = queue.enqueue_unmap_buffer( result.get_buffer(), static_cast(pointer) ); unmap_event.wait(); return result + static_cast(count); } template inline future copy_to_device_async(HostIterator first, HostIterator last, DeviceIterator result, command_queue &queue) { typedef typename std::iterator_traits::value_type value_type; typedef typename std::iterator_traits::difference_type difference_type; size_t count = iterator_range_size(first, last); if(count == 0){ return future(); } size_t offset = result.get_index(); event event_ = queue.enqueue_write_buffer_async(result.get_buffer(), offset * sizeof(value_type), count * sizeof(value_type), ::boost::addressof(*first)); return make_future(result + static_cast(count), event_); } #ifdef CL_VERSION_2_0 // copy_to_device() specialization for svm_ptr template inline svm_ptr copy_to_device(HostIterator first, HostIterator last, svm_ptr result, command_queue &queue) { size_t count = iterator_range_size(first, last); if(count == 0){ return result; } queue.enqueue_svm_memcpy( result.get(), ::boost::addressof(*first), count * sizeof(T) ); return result + count; } template inline future > copy_to_device_async(HostIterator first, HostIterator last, svm_ptr result, command_queue &queue) { size_t count = iterator_range_size(first, last); if(count == 0){ return future >(); } event event_ = queue.enqueue_svm_memcpy_async( result.get(), ::boost::addressof(*first), count * sizeof(T) ); return make_future(result + count, event_); } template inline svm_ptr copy_to_device_map(HostIterator first, HostIterator last, svm_ptr result, command_queue &queue) { size_t count = iterator_range_size(first, last); if(count == 0){ return result; } // map queue.enqueue_svm_map(result.get(), count * sizeof(T), CL_MAP_WRITE); // copy [first; last) to result buffer std::copy(first, last, static_cast(result.get())); // unmap result queue.enqueue_svm_unmap(result.get()).wait(); return result + count; } #endif // CL_VERSION_2_0 } // end detail namespace } // end compute namespace } // end boost namespace #endif // BOOST_COMPUTE_ALGORITHM_DETAIL_COPY_TO_DEVICE_HPP