98 lines
3.5 KiB
Plaintext
98 lines
3.5 KiB
Plaintext
|
//---------------------------------------------------------------------------//
|
||
|
// Copyright (c) 2013 Kyle Lutz <kyle.r.lutz@gmail.com>
|
||
|
//
|
||
|
// Distributed under the Boost Software License, Version 1.0
|
||
|
// See accompanying file LICENSE_1_0.txt or copy at
|
||
|
// http://www.boost.org/LICENSE_1_0.txt
|
||
|
//
|
||
|
// See http://boostorg.github.com/compute for more information.
|
||
|
//---------------------------------------------------------------------------//
|
||
|
|
||
|
#ifndef BOOST_COMPUTE_ALGORITHM_SERIAL_MERGE_HPP
|
||
|
#define BOOST_COMPUTE_ALGORITHM_SERIAL_MERGE_HPP
|
||
|
|
||
|
#include <iterator>
|
||
|
|
||
|
#include <boost/compute/command_queue.hpp>
|
||
|
#include <boost/compute/detail/meta_kernel.hpp>
|
||
|
#include <boost/compute/detail/iterator_range_size.hpp>
|
||
|
|
||
|
namespace boost {
|
||
|
namespace compute {
|
||
|
namespace detail {
|
||
|
|
||
|
template<class InputIterator1,
|
||
|
class InputIterator2,
|
||
|
class OutputIterator,
|
||
|
class Compare>
|
||
|
inline OutputIterator serial_merge(InputIterator1 first1,
|
||
|
InputIterator1 last1,
|
||
|
InputIterator2 first2,
|
||
|
InputIterator2 last2,
|
||
|
OutputIterator result,
|
||
|
Compare comp,
|
||
|
command_queue &queue)
|
||
|
{
|
||
|
typedef typename
|
||
|
std::iterator_traits<InputIterator1>::value_type
|
||
|
input_type1;
|
||
|
typedef typename
|
||
|
std::iterator_traits<InputIterator2>::value_type
|
||
|
input_type2;
|
||
|
typedef typename
|
||
|
std::iterator_traits<OutputIterator>::difference_type
|
||
|
result_difference_type;
|
||
|
|
||
|
std::ptrdiff_t size1 = std::distance(first1, last1);
|
||
|
std::ptrdiff_t size2 = std::distance(first2, last2);
|
||
|
|
||
|
meta_kernel k("serial_merge");
|
||
|
k.add_set_arg<uint_>("size1", static_cast<uint_>(size1));
|
||
|
k.add_set_arg<uint_>("size2", static_cast<uint_>(size2));
|
||
|
|
||
|
k <<
|
||
|
"uint i = 0;\n" << // index in result range
|
||
|
"uint j = 0;\n" << // index in first input range
|
||
|
"uint k = 0;\n" << // index in second input range
|
||
|
|
||
|
// fetch initial values from each range
|
||
|
k.decl<input_type1>("j_value") << " = " << first1[0] << ";\n" <<
|
||
|
k.decl<input_type2>("k_value") << " = " << first2[0] << ";\n" <<
|
||
|
|
||
|
// merge values from both input ranges to the result range
|
||
|
"while(j < size1 && k < size2){\n" <<
|
||
|
" if(" << comp(k.var<input_type1>("j_value"),
|
||
|
k.var<input_type2>("k_value")) << "){\n" <<
|
||
|
" " << result[k.var<uint_>("i++")] << " = j_value;\n" <<
|
||
|
" j_value = " << first1[k.var<uint_>("++j")] << ";\n" <<
|
||
|
" }\n" <<
|
||
|
" else{\n"
|
||
|
" " << result[k.var<uint_>("i++")] << " = k_value;\n"
|
||
|
" k_value = " << first2[k.var<uint_>("++k")] << ";\n" <<
|
||
|
" }\n"
|
||
|
"}\n"
|
||
|
|
||
|
// copy any remaining values from first range
|
||
|
"while(j < size1){\n" <<
|
||
|
result[k.var<uint_>("i++")] << " = " <<
|
||
|
first1[k.var<uint_>("j++")] << ";\n" <<
|
||
|
"}\n"
|
||
|
|
||
|
// copy any remaining values from second range
|
||
|
"while(k < size2){\n" <<
|
||
|
result[k.var<uint_>("i++")] << " = " <<
|
||
|
first2[k.var<uint_>("k++")] << ";\n" <<
|
||
|
"}\n";
|
||
|
|
||
|
// run kernel
|
||
|
k.exec(queue);
|
||
|
|
||
|
return result + static_cast<result_difference_type>(size1 + size2);
|
||
|
}
|
||
|
|
||
|
} // end detail namespace
|
||
|
} // end compute namespace
|
||
|
} // end boost namespace
|
||
|
|
||
|
#endif // BOOST_COMPUTE_ALGORITHM_SERIAL_MERGE_HPP
|