239 lines
		
	
	
		
			7.6 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
		
		
			
		
	
	
			239 lines
		
	
	
		
			7.6 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
| 
								 | 
							
								//---------------------------------------------------------------------------//
							 | 
						||
| 
								 | 
							
								// Copyright (c) 2014 Roshan <thisisroshansmail@gmail.com>
							 | 
						||
| 
								 | 
							
								//
							 | 
						||
| 
								 | 
							
								// Distributed under the Boost Software License, Version 1.0
							 | 
						||
| 
								 | 
							
								// See accompanying file LICENSE_1_0.txt or copy at
							 | 
						||
| 
								 | 
							
								// http://www.boost.org/LICENSE_1_0.txt
							 | 
						||
| 
								 | 
							
								//
							 | 
						||
| 
								 | 
							
								// See http://boostorg.github.com/compute for more information.
							 | 
						||
| 
								 | 
							
								//---------------------------------------------------------------------------//
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#ifndef BOOST_COMPUTE_RANDOM_LINEAR_CONGRUENTIAL_ENGINE_HPP
							 | 
						||
| 
								 | 
							
								#define BOOST_COMPUTE_RANDOM_LINEAR_CONGRUENTIAL_ENGINE_HPP
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#include <algorithm>
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#include <boost/compute/types.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/buffer.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/kernel.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/context.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/program.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/command_queue.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/algorithm/transform.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/container/vector.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/detail/iterator_range_size.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/iterator/discard_iterator.hpp>
							 | 
						||
| 
								 | 
							
								#include <boost/compute/utility/program_cache.hpp>
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								namespace boost {
							 | 
						||
| 
								 | 
							
								namespace compute {
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								///
							 | 
						||
| 
								 | 
							
								/// \class linear_congruential_engine
							 | 
						||
| 
								 | 
							
								/// \brief 'Quick and Dirty' linear congruential engine
							 | 
						||
| 
								 | 
							
								///
							 | 
						||
| 
								 | 
							
								/// Quick and dirty linear congruential engine to generate low quality
							 | 
						||
| 
								 | 
							
								/// random numbers very quickly. For uses in which good quality of random
							 | 
						||
| 
								 | 
							
								/// numbers is required(Monte-Carlo Simulations), use other engines like
							 | 
						||
| 
								 | 
							
								/// Mersenne Twister instead.
							 | 
						||
| 
								 | 
							
								///
							 | 
						||
| 
								 | 
							
								template<class T = uint_>
							 | 
						||
| 
								 | 
							
								class linear_congruential_engine
							 | 
						||
| 
								 | 
							
								{
							 | 
						||
| 
								 | 
							
								public:
							 | 
						||
| 
								 | 
							
								    typedef T result_type;
							 | 
						||
| 
								 | 
							
								    static const T default_seed = 1;
							 | 
						||
| 
								 | 
							
								    static const T a = 1099087573;
							 | 
						||
| 
								 | 
							
								    static const size_t threads = 1024;
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    /// Creates a new linear_congruential_engine and seeds it with \p value.
							 | 
						||
| 
								 | 
							
								    explicit linear_congruential_engine(command_queue &queue,
							 | 
						||
| 
								 | 
							
								                                        result_type value = default_seed)
							 | 
						||
| 
								 | 
							
								        : m_context(queue.get_context()),
							 | 
						||
| 
								 | 
							
								          m_multiplicands(m_context, threads * sizeof(result_type))
							 | 
						||
| 
								 | 
							
								    {
							 | 
						||
| 
								 | 
							
								        // setup program
							 | 
						||
| 
								 | 
							
								        load_program();
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								        // seed state
							 | 
						||
| 
								 | 
							
								        seed(value, queue);
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								        // generate multiplicands
							 | 
						||
| 
								 | 
							
								        generate_multiplicands(queue);
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    /// Creates a new linear_congruential_engine object as a copy of \p other.
							 | 
						||
| 
								 | 
							
								    linear_congruential_engine(const linear_congruential_engine<T> &other)
							 | 
						||
| 
								 | 
							
								        : m_context(other.m_context),
							 | 
						||
| 
								 | 
							
								          m_program(other.m_program),
							 | 
						||
| 
								 | 
							
								          m_seed(other.m_seed),
							 | 
						||
| 
								 | 
							
								          m_multiplicands(other.m_multiplicands)
							 | 
						||
| 
								 | 
							
								    {
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    /// Copies \p other to \c *this.
							 | 
						||
| 
								 | 
							
								    linear_congruential_engine<T>&
							 | 
						||
| 
								 | 
							
								    operator=(const linear_congruential_engine<T> &other)
							 | 
						||
| 
								 | 
							
								    {
							 | 
						||
| 
								 | 
							
								        if(this != &other){
							 | 
						||
| 
								 | 
							
								            m_context = other.m_context;
							 | 
						||
| 
								 | 
							
								            m_program = other.m_program;
							 | 
						||
| 
								 | 
							
								            m_seed = other.m_seed;
							 | 
						||
| 
								 | 
							
								            m_multiplicands = other.m_multiplicands;
							 | 
						||
| 
								 | 
							
								        }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								        return *this;
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    /// Destroys the linear_congruential_engine object.
							 | 
						||
| 
								 | 
							
								    ~linear_congruential_engine()
							 | 
						||
| 
								 | 
							
								    {
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    /// Seeds the random number generator with \p value.
							 | 
						||
| 
								 | 
							
								    ///
							 | 
						||
| 
								 | 
							
								    /// \param value seed value for the random-number generator
							 | 
						||
| 
								 | 
							
								    /// \param queue command queue to perform the operation
							 | 
						||
| 
								 | 
							
								    ///
							 | 
						||
| 
								 | 
							
								    /// If no seed value is provided, \c default_seed is used.
							 | 
						||
| 
								 | 
							
								    void seed(result_type value, command_queue &queue)
							 | 
						||
| 
								 | 
							
								    {
							 | 
						||
| 
								 | 
							
								        (void) queue;
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								        m_seed = value;
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    /// \overload
							 | 
						||
| 
								 | 
							
								    void seed(command_queue &queue)
							 | 
						||
| 
								 | 
							
								    {
							 | 
						||
| 
								 | 
							
								        seed(default_seed, queue);
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    /// Generates random numbers and stores them to the range [\p first, \p last).
							 | 
						||
| 
								 | 
							
								    template<class OutputIterator>
							 | 
						||
| 
								 | 
							
								    void generate(OutputIterator first, OutputIterator last, command_queue &queue)
							 | 
						||
| 
								 | 
							
								    {
							 | 
						||
| 
								 | 
							
								        size_t size = detail::iterator_range_size(first, last);
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								        kernel fill_kernel(m_program, "fill");
							 | 
						||
| 
								 | 
							
								        fill_kernel.set_arg(1, m_multiplicands);
							 | 
						||
| 
								 | 
							
								        fill_kernel.set_arg(2, first.get_buffer());
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								        size_t offset = 0;
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								        for(;;){
							 | 
						||
| 
								 | 
							
								            size_t count = 0;
							 | 
						||
| 
								 | 
							
								            if(size > threads){
							 | 
						||
| 
								 | 
							
								                count = (std::min)(static_cast<size_t>(threads), size - offset);
							 | 
						||
| 
								 | 
							
								            }
							 | 
						||
| 
								 | 
							
								            else {
							 | 
						||
| 
								 | 
							
								                count = size;
							 | 
						||
| 
								 | 
							
								            }
							 | 
						||
| 
								 | 
							
								            fill_kernel.set_arg(0, static_cast<const uint_>(m_seed));
							 | 
						||
| 
								 | 
							
								            fill_kernel.set_arg(3, static_cast<const uint_>(offset));
							 | 
						||
| 
								 | 
							
								            queue.enqueue_1d_range_kernel(fill_kernel, 0, count, 0);
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								            offset += count;
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								            if(offset >= size){
							 | 
						||
| 
								 | 
							
								                break;
							 | 
						||
| 
								 | 
							
								            }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								            update_seed(queue);
							 | 
						||
| 
								 | 
							
								        }
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    /// \internal_
							 | 
						||
| 
								 | 
							
								    void generate(discard_iterator first, discard_iterator last, command_queue &queue)
							 | 
						||
| 
								 | 
							
								    {
							 | 
						||
| 
								 | 
							
								        (void) queue;
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								        size_t size = detail::iterator_range_size(first, last);
							 | 
						||
| 
								 | 
							
								        uint_ max_mult =
							 | 
						||
| 
								 | 
							
								            detail::read_single_value<T>(m_multiplicands, threads-1, queue);
							 | 
						||
| 
								 | 
							
								        while(size >= threads) {
							 | 
						||
| 
								 | 
							
								            m_seed *= max_mult;
							 | 
						||
| 
								 | 
							
								            size -= threads;
							 | 
						||
| 
								 | 
							
								        }
							 | 
						||
| 
								 | 
							
								        m_seed *=
							 | 
						||
| 
								 | 
							
								            detail::read_single_value<T>(m_multiplicands, size-1, queue);
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    /// Generates random numbers, transforms them with \p op, and then stores
							 | 
						||
| 
								 | 
							
								    /// them to the range [\p first, \p last).
							 | 
						||
| 
								 | 
							
								    template<class OutputIterator, class Function>
							 | 
						||
| 
								 | 
							
								    void generate(OutputIterator first, OutputIterator last, Function op, command_queue &queue)
							 | 
						||
| 
								 | 
							
								    {
							 | 
						||
| 
								 | 
							
								        vector<T> tmp(std::distance(first, last), queue.get_context());
							 | 
						||
| 
								 | 
							
								        generate(tmp.begin(), tmp.end(), queue);
							 | 
						||
| 
								 | 
							
								        transform(tmp.begin(), tmp.end(), first, op, queue);
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    /// Generates \p z random numbers and discards them.
							 | 
						||
| 
								 | 
							
								    void discard(size_t z, command_queue &queue)
							 | 
						||
| 
								 | 
							
								    {
							 | 
						||
| 
								 | 
							
								        generate(discard_iterator(0), discard_iterator(z), queue);
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								private:
							 | 
						||
| 
								 | 
							
								    /// \internal_
							 | 
						||
| 
								 | 
							
								    /// Generates the multiplicands for each thread
							 | 
						||
| 
								 | 
							
								    void generate_multiplicands(command_queue &queue)
							 | 
						||
| 
								 | 
							
								    {
							 | 
						||
| 
								 | 
							
								        kernel multiplicand_kernel =
							 | 
						||
| 
								 | 
							
								            m_program.create_kernel("multiplicand");
							 | 
						||
| 
								 | 
							
								        multiplicand_kernel.set_arg(0, m_multiplicands);
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								        queue.enqueue_task(multiplicand_kernel);
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    /// \internal_
							 | 
						||
| 
								 | 
							
								    void update_seed(command_queue &queue)
							 | 
						||
| 
								 | 
							
								    {
							 | 
						||
| 
								 | 
							
								        m_seed *=
							 | 
						||
| 
								 | 
							
								            detail::read_single_value<T>(m_multiplicands, threads-1, queue);
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								    /// \internal_
							 | 
						||
| 
								 | 
							
								    void load_program()
							 | 
						||
| 
								 | 
							
								    {
							 | 
						||
| 
								 | 
							
								        boost::shared_ptr<program_cache> cache =
							 | 
						||
| 
								 | 
							
								            program_cache::get_global_cache(m_context);
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								        std::string cache_key =
							 | 
						||
| 
								 | 
							
								            std::string("__boost_linear_congruential_engine_") + type_name<T>();
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								        const char source[] =
							 | 
						||
| 
								 | 
							
								            "__kernel void multiplicand(__global uint *multiplicands)\n"
							 | 
						||
| 
								 | 
							
								            "{\n"
							 | 
						||
| 
								 | 
							
								            "    uint a = 1099087573;\n"
							 | 
						||
| 
								 | 
							
								            "    multiplicands[0] = a;\n"
							 | 
						||
| 
								 | 
							
								            "    for(uint i = 1; i < 1024; i++){\n"
							 | 
						||
| 
								 | 
							
								            "        multiplicands[i] = a * multiplicands[i-1];\n"
							 | 
						||
| 
								 | 
							
								            "    }\n"
							 | 
						||
| 
								 | 
							
								            "}\n"
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								            "__kernel void fill(const uint seed,\n"
							 | 
						||
| 
								 | 
							
								            "                   __global uint *multiplicands,\n"
							 | 
						||
| 
								 | 
							
								            "                   __global uint *result,"
							 | 
						||
| 
								 | 
							
								            "                   const uint offset)\n"
							 | 
						||
| 
								 | 
							
								            "{\n"
							 | 
						||
| 
								 | 
							
								            "    const uint i = get_global_id(0);\n"
							 | 
						||
| 
								 | 
							
								            "    result[offset+i] = seed * multiplicands[i];\n"
							 | 
						||
| 
								 | 
							
								            "}\n";
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								        m_program = cache->get_or_build(cache_key, std::string(), source, m_context);
							 | 
						||
| 
								 | 
							
								    }
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								private:
							 | 
						||
| 
								 | 
							
								    context m_context;
							 | 
						||
| 
								 | 
							
								    program m_program;
							 | 
						||
| 
								 | 
							
								    T m_seed;
							 | 
						||
| 
								 | 
							
								    buffer m_multiplicands;
							 | 
						||
| 
								 | 
							
								};
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								} // end compute namespace
							 | 
						||
| 
								 | 
							
								} // end boost namespace
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#endif // BOOST_COMPUTE_RANDOM_LINEAR_CONGRUENTIAL_ENGINE_HPP
							 |