//---------------------------------------------------------------------------//
// Copyright (c) 2013 Kyle Lutz <kyle.r.lutz@gmail.com>
//
// Distributed under the Boost Software License, Version 1.0
// See accompanying file LICENSE_1_0.txt or copy at
// http://www.boost.org/LICENSE_1_0.txt
//
// See http://boostorg.github.com/compute for more information.
//---------------------------------------------------------------------------//

#ifndef BOOST_COMPUTE_FUNCTIONAL_DETAIL_NVIDIA_POPCOUNT_HPP
|
|
#define BOOST_COMPUTE_FUNCTIONAL_DETAIL_NVIDIA_POPCOUNT_HPP
|
|
|
|
#include <boost/compute/function.hpp>
|
|
|
|
namespace boost {
|
|
namespace compute {
|
|
namespace detail {
|
|
|
|
template<class T>
|
|
class nvidia_popcount : public function<T(T)>
|
|
{
|
|
public:
|
|
nvidia_popcount()
|
|
: function<T(T)>("nvidia_popcount")
|
|
{
|
|
this->set_source(
|
|
"inline uint nvidia_popcount(const uint x)\n"
|
|
"{\n"
|
|
" uint count;\n"
|
|
" asm(\"popc.b32 %0, %1;\" : \"=r\"(count) : \"r\"(x));\n"
|
|
" return count;\n"
|
|
"}\n"
|
|
);
|
|
}
|
|
};
|
|
|
|
} // end detail namespace
|
|
} // end compute namespace
|
|
} // end boost namespace
|
|
|
|
#endif // BOOST_COMPUTE_FUNCTIONAL_DETAIL_NVIDIA_POPCOUNT_HPP
|