120 lines
		
	
	
		
			5.2 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
		
		
			
		
	
	
			120 lines
		
	
	
		
			5.2 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
|   | //---------------------------------------------------------------------------// | ||
|  | // Copyright (c) 2015 Jakub Szuppe <j.szuppe@gmail.com> | ||
|  | // | ||
|  | // Distributed under the Boost Software License, Version 1.0 | ||
|  | // See accompanying file LICENSE_1_0.txt or copy at | ||
|  | // http://www.boost.org/LICENSE_1_0.txt | ||
|  | // | ||
|  | // See http://boostorg.github.com/compute for more information. | ||
|  | //---------------------------------------------------------------------------// | ||
|  | 
 | ||
|  | #ifndef BOOST_COMPUTE_ALGORITHM_DETAIL_REDUCE_BY_KEY_HPP | ||
|  | #define BOOST_COMPUTE_ALGORITHM_DETAIL_REDUCE_BY_KEY_HPP | ||
|  | 
 | ||
|  | #include <algorithm> | ||
|  | #include <iterator> | ||
|  | 
 | ||
|  | #include <boost/compute/command_queue.hpp> | ||
|  | #include <boost/compute/functional.hpp> | ||
|  | #include <boost/compute/container/vector.hpp> | ||
|  | #include <boost/compute/detail/iterator_range_size.hpp> | ||
|  | #include <boost/compute/algorithm/detail/serial_reduce_by_key.hpp> | ||
|  | #include <boost/compute/algorithm/detail/reduce_by_key_with_scan.hpp> | ||
|  | #include <boost/compute/type_traits.hpp> | ||
|  | 
 | ||
|  | namespace boost { | ||
|  | namespace compute { | ||
|  | namespace detail { | ||
|  | 
 | ||
|  | template<class InputKeyIterator, class InputValueIterator, | ||
|  |          class OutputKeyIterator, class OutputValueIterator, | ||
|  |          class BinaryFunction, class BinaryPredicate> | ||
|  | size_t reduce_by_key_on_gpu(InputKeyIterator keys_first, | ||
|  |                             InputKeyIterator keys_last, | ||
|  |                             InputValueIterator values_first, | ||
|  |                             OutputKeyIterator keys_result, | ||
|  |                             OutputValueIterator values_result, | ||
|  |                             BinaryFunction function, | ||
|  |                             BinaryPredicate predicate, | ||
|  |                             command_queue &queue) | ||
|  | { | ||
|  |     return detail::reduce_by_key_with_scan(keys_first, keys_last, values_first, | ||
|  |                                            keys_result, values_result, function, | ||
|  |                                            predicate, queue); | ||
|  | } | ||
|  | 
 | ||
|  | template<class InputKeyIterator, class InputValueIterator, | ||
|  |          class OutputKeyIterator, class OutputValueIterator> | ||
|  | bool reduce_by_key_on_gpu_requirements_met(InputKeyIterator keys_first, | ||
|  |                                            InputValueIterator values_first, | ||
|  |                                            OutputKeyIterator keys_result, | ||
|  |                                            OutputValueIterator values_result, | ||
|  |                                            const size_t count, | ||
|  |                                            command_queue &queue) | ||
|  | { | ||
|  |     const device &device = queue.get_device(); | ||
|  |     return (count > 256) | ||
|  |                && !(device.type() & device::cpu) | ||
|  |                && reduce_by_key_with_scan_requirements_met(keys_first, values_first, | ||
|  |                                                            keys_result,values_result, | ||
|  |                                                            count, queue); | ||
|  |     return true; | ||
|  | } | ||
|  | 
 | ||
|  | template<class InputKeyIterator, class InputValueIterator, | ||
|  |          class OutputKeyIterator, class OutputValueIterator, | ||
|  |          class BinaryFunction, class BinaryPredicate> | ||
|  | inline std::pair<OutputKeyIterator, OutputValueIterator> | ||
|  | dispatch_reduce_by_key(InputKeyIterator keys_first, | ||
|  |                        InputKeyIterator keys_last, | ||
|  |                        InputValueIterator values_first, | ||
|  |                        OutputKeyIterator keys_result, | ||
|  |                        OutputValueIterator values_result, | ||
|  |                        BinaryFunction function, | ||
|  |                        BinaryPredicate predicate, | ||
|  |                        command_queue &queue) | ||
|  | { | ||
|  |     typedef typename | ||
|  |         std::iterator_traits<OutputKeyIterator>::difference_type key_difference_type; | ||
|  |     typedef typename | ||
|  |         std::iterator_traits<OutputValueIterator>::difference_type value_difference_type; | ||
|  | 
 | ||
|  |     const size_t count = detail::iterator_range_size(keys_first, keys_last); | ||
|  |     if (count < 2) { | ||
|  |         boost::compute::copy_n(keys_first, count, keys_result, queue); | ||
|  |         boost::compute::copy_n(values_first, count, values_result, queue); | ||
|  |         return | ||
|  |             std::make_pair<OutputKeyIterator, OutputValueIterator>( | ||
|  |                 keys_result + static_cast<key_difference_type>(count), | ||
|  |                 values_result + static_cast<value_difference_type>(count) | ||
|  |             ); | ||
|  |     } | ||
|  | 
 | ||
|  |     size_t result_size = 0; | ||
|  |     if(reduce_by_key_on_gpu_requirements_met(keys_first, values_first, keys_result, | ||
|  |                                              values_result, count, queue)){ | ||
|  |         result_size = | ||
|  |             detail::reduce_by_key_on_gpu(keys_first, keys_last, values_first, | ||
|  |                                          keys_result, values_result, function, | ||
|  |                                          predicate, queue); | ||
|  |     } | ||
|  |     else { | ||
|  |         result_size = | ||
|  |               detail::serial_reduce_by_key(keys_first, keys_last, values_first, | ||
|  |                                            keys_result, values_result, function, | ||
|  |                                            predicate, queue); | ||
|  |     } | ||
|  | 
 | ||
|  |     return | ||
|  |         std::make_pair<OutputKeyIterator, OutputValueIterator>( | ||
|  |             keys_result + static_cast<key_difference_type>(result_size), | ||
|  |             values_result + static_cast<value_difference_type>(result_size) | ||
|  |         ); | ||
|  | } | ||
|  | 
 | ||
|  | } // end detail namespace | ||
|  | } // end compute namespace | ||
|  | } // end boost namespace | ||
|  | 
 | ||
|  | #endif // BOOST_COMPUTE_ALGORITHM_DETAIL_REDUCE_BY_KEY_HPP |