120 lines
		
	
	
		
			5.2 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
		
		
			
		
	
	
			120 lines
		
	
	
		
			5.2 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
| 
								 | 
							
								//---------------------------------------------------------------------------//
							 | 
						||
| 
								 | 
							
								// Copyright (c) 2015 Jakub Szuppe <j.szuppe@gmail.com>
							 | 
						||
| 
								 | 
							
								//
							 | 
						||
| 
								 | 
							
								// Distributed under the Boost Software License, Version 1.0
							 | 
						||
| 
								 | 
							
								// See accompanying file LICENSE_1_0.txt or copy at
							 | 
						||
| 
								 | 
							
								// http://www.boost.org/LICENSE_1_0.txt
							 | 
						||
| 
								 | 
							
								//
							 | 
						||
| 
								 | 
							
								// See http://boostorg.github.com/compute for more information.
							 | 
						||
| 
								 | 
							
								//---------------------------------------------------------------------------//
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#ifndef BOOST_COMPUTE_ALGORITHM_DETAIL_REDUCE_BY_KEY_HPP
							 | 
						||
| 
								 | 
							
								#define BOOST_COMPUTE_ALGORITHM_DETAIL_REDUCE_BY_KEY_HPP
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#include <algorithm>
							 | 
						||
| 
								 | 
							
								#include <iterator>
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#include <boost/compute/command_queue.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/functional.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/container/vector.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/detail/iterator_range_size.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/algorithm/detail/serial_reduce_by_key.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/algorithm/detail/reduce_by_key_with_scan.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/type_traits.hpp>
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								namespace boost {
							 | 
						||
| 
								 | 
							
								namespace compute {
							 | 
						||
| 
								 | 
							
								namespace detail {
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								template<class InputKeyIterator, class InputValueIterator,
							 | 
						||
| 
								 | 
							
								         class OutputKeyIterator, class OutputValueIterator,
							 | 
						||
| 
								 | 
							
								         class BinaryFunction, class BinaryPredicate>
							 | 
						||
| 
								 | 
							
								size_t reduce_by_key_on_gpu(InputKeyIterator keys_first,
							 | 
						||
| 
								 | 
							
								                            InputKeyIterator keys_last,
							 | 
						||
| 
								 | 
							
								                            InputValueIterator values_first,
							 | 
						||
| 
								 | 
							
								                            OutputKeyIterator keys_result,
							 | 
						||
| 
								 | 
							
								                            OutputValueIterator values_result,
							 | 
						||
| 
								 | 
							
								                            BinaryFunction function,
							 | 
						||
| 
								 | 
							
								                            BinaryPredicate predicate,
							 | 
						||
| 
								 | 
							
								                            command_queue &queue)
							 | 
						||
| 
								 | 
							
								{
							 | 
						||
| 
								 | 
							
								    return detail::reduce_by_key_with_scan(keys_first, keys_last, values_first,
							 | 
						||
| 
								 | 
							
								                                           keys_result, values_result, function,
							 | 
						||
| 
								 | 
							
								                                           predicate, queue);
							 | 
						||
| 
								 | 
							
								}
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								template<class InputKeyIterator, class InputValueIterator,
							 | 
						||
| 
								 | 
							
								         class OutputKeyIterator, class OutputValueIterator>
							 | 
						||
| 
								 | 
							
								bool reduce_by_key_on_gpu_requirements_met(InputKeyIterator keys_first,
							 | 
						||
| 
								 | 
							
								                                           InputValueIterator values_first,
							 | 
						||
| 
								 | 
							
								                                           OutputKeyIterator keys_result,
							 | 
						||
| 
								 | 
							
								                                           OutputValueIterator values_result,
							 | 
						||
| 
								 | 
							
								                                           const size_t count,
							 | 
						||
| 
								 | 
							
								                                           command_queue &queue)
							 | 
						||
| 
								 | 
							
								{
							 | 
						||
| 
								 | 
							
								    const device &device = queue.get_device();
							 | 
						||
| 
								 | 
							
								    return (count > 256)
							 | 
						||
| 
								 | 
							
								               && !(device.type() & device::cpu)
							 | 
						||
| 
								 | 
							
								               && reduce_by_key_with_scan_requirements_met(keys_first, values_first,
							 | 
						||
| 
								 | 
							
								                                                           keys_result,values_result,
							 | 
						||
| 
								 | 
							
								                                                           count, queue);
							 | 
						||
| 
								 | 
							
								    return true;
							 | 
						||
| 
								 | 
							
								}
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								template<class InputKeyIterator, class InputValueIterator,
							 | 
						||
| 
								 | 
							
								         class OutputKeyIterator, class OutputValueIterator,
							 | 
						||
| 
								 | 
							
								         class BinaryFunction, class BinaryPredicate>
							 | 
						||
| 
								 | 
							
								inline std::pair<OutputKeyIterator, OutputValueIterator>
							 | 
						||
| 
								 | 
							
								dispatch_reduce_by_key(InputKeyIterator keys_first,
							 | 
						||
| 
								 | 
							
								                       InputKeyIterator keys_last,
							 | 
						||
| 
								 | 
							
								                       InputValueIterator values_first,
							 | 
						||
| 
								 | 
							
								                       OutputKeyIterator keys_result,
							 | 
						||
| 
								 | 
							
								                       OutputValueIterator values_result,
							 | 
						||
| 
								 | 
							
								                       BinaryFunction function,
							 | 
						||
| 
								 | 
							
								                       BinaryPredicate predicate,
							 | 
						||
| 
								 | 
							
								                       command_queue &queue)
							 | 
						||
| 
								 | 
							
								{
							 | 
						||
| 
								 | 
							
								    typedef typename
							 | 
						||
| 
								 | 
							
								        std::iterator_traits<OutputKeyIterator>::difference_type key_difference_type;
							 | 
						||
| 
								 | 
							
								    typedef typename
							 | 
						||
| 
								 | 
							
								        std::iterator_traits<OutputValueIterator>::difference_type value_difference_type;
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    const size_t count = detail::iterator_range_size(keys_first, keys_last);
							 | 
						||
| 
								 | 
							
								    if (count < 2) {
							 | 
						||
| 
								 | 
							
								        boost::compute::copy_n(keys_first, count, keys_result, queue);
							 | 
						||
| 
								 | 
							
								        boost::compute::copy_n(values_first, count, values_result, queue);
							 | 
						||
| 
								 | 
							
								        return
							 | 
						||
| 
								 | 
							
								            std::make_pair<OutputKeyIterator, OutputValueIterator>(
							 | 
						||
| 
								 | 
							
								                keys_result + static_cast<key_difference_type>(count),
							 | 
						||
| 
								 | 
							
								                values_result + static_cast<value_difference_type>(count)
							 | 
						||
| 
								 | 
							
								            );
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    size_t result_size = 0;
							 | 
						||
| 
								 | 
							
								    if(reduce_by_key_on_gpu_requirements_met(keys_first, values_first, keys_result,
							 | 
						||
| 
								 | 
							
								                                             values_result, count, queue)){
							 | 
						||
| 
								 | 
							
								        result_size =
							 | 
						||
| 
								 | 
							
								            detail::reduce_by_key_on_gpu(keys_first, keys_last, values_first,
							 | 
						||
| 
								 | 
							
								                                         keys_result, values_result, function,
							 | 
						||
| 
								 | 
							
								                                         predicate, queue);
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								    else {
							 | 
						||
| 
								 | 
							
								        result_size =
							 | 
						||
| 
								 | 
							
								              detail::serial_reduce_by_key(keys_first, keys_last, values_first,
							 | 
						||
| 
								 | 
							
								                                           keys_result, values_result, function,
							 | 
						||
| 
								 | 
							
								                                           predicate, queue);
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    return
							 | 
						||
| 
								 | 
							
								        std::make_pair<OutputKeyIterator, OutputValueIterator>(
							 | 
						||
| 
								 | 
							
								            keys_result + static_cast<key_difference_type>(result_size),
							 | 
						||
| 
								 | 
							
								            values_result + static_cast<value_difference_type>(result_size)
							 | 
						||
| 
								 | 
							
								        );
							 | 
						||
| 
								 | 
							
								}
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								} // end detail namespace
							 | 
						||
| 
								 | 
							
								} // end compute namespace
							 | 
						||
| 
								 | 
							
								} // end boost namespace
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#endif // BOOST_COMPUTE_ALGORITHM_DETAIL_REDUCE_BY_KEY_HPP
							 |