169 lines
		
	
	
		
			5.9 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
			
		
		
	
	
			169 lines
		
	
	
		
			5.9 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
| // Copyright (C) 2005-2006 Douglas Gregor <doug.gregor@gmail.com>.
 | |
| // Copyright (C) 2004 The Trustees of Indiana University
 | |
| 
 | |
| // Use, modification and distribution is subject to the Boost Software
 | |
| // License, Version 1.0. (See accompanying file LICENSE_1_0.txt or copy at
 | |
| // http://www.boost.org/LICENSE_1_0.txt)
 | |
| 
 | |
| //   Authors: Douglas Gregor
 | |
| //            Andrew Lumsdaine
 | |
| 
 | |
| // Message Passing Interface 1.1 -- Section 4.9.1. Scan
 | |
| #ifndef BOOST_MPI_SCAN_HPP
 | |
| #define BOOST_MPI_SCAN_HPP
 | |
| 
 | |
| #include <boost/mpi/exception.hpp>
 | |
| #include <boost/mpi/datatype.hpp>
 | |
| 
 | |
| // For (de-)serializing sends and receives
 | |
| #include <boost/mpi/packed_oarchive.hpp>
 | |
| #include <boost/mpi/packed_iarchive.hpp>
 | |
| 
 | |
| // For packed_[io]archive sends and receives
 | |
| #include <boost/mpi/detail/point_to_point.hpp>
 | |
| 
 | |
| #include <boost/mpi/communicator.hpp>
 | |
| #include <boost/mpi/environment.hpp>
 | |
| #include <boost/mpi/detail/computation_tree.hpp>
 | |
| #include <boost/mpi/operations.hpp>
 | |
| #include <algorithm>
 | |
| #include <exception>
 | |
| #include <boost/assert.hpp>
 | |
| 
 | |
| namespace boost { namespace mpi {
 | |
| 
 | |
| 
 | |
| /************************************************************************
 | |
|  * Implementation details                                               *
 | |
|  ************************************************************************/
 | |
| namespace detail {
 | |
|   /**********************************************************************
 | |
|    * Simple prefix reduction with MPI_Scan                              *
 | |
|    **********************************************************************/
 | |
| 
 | |
|   // We are performing prefix reduction for a type that has an
 | |
|   // associated MPI datatype and operation, so we'll use MPI_Scan
 | |
|   // directly.
 | |
|   template<typename T, typename Op>
 | |
|   void
 | |
|   scan_impl(const communicator& comm, const T* in_values, int n, T* out_values,
 | |
|             Op /*op*/, mpl::true_ /*is_mpi_op*/, mpl::true_ /*is_mpi_datatype*/)
 | |
|   {
 | |
|     BOOST_MPI_CHECK_RESULT(MPI_Scan,
 | |
|                            (const_cast<T*>(in_values), out_values, n,
 | |
|                             boost::mpi::get_mpi_datatype<T>(*in_values),
 | |
|                             (is_mpi_op<Op, T>::op()), comm));
 | |
|   }
 | |
| 
 | |
|   /**********************************************************************
 | |
|    * User-defined prefix reduction with MPI_Scan                        *
 | |
|    **********************************************************************/
 | |
| 
 | |
|   // We are performing prefix reduction for a type that has an
 | |
|   // associated MPI datatype but with a custom operation. We'll use
 | |
|   // MPI_Scan directly, but we'll need to create an MPI_Op manually.
 | |
|   template<typename T, typename Op>
 | |
|   void
 | |
|   scan_impl(const communicator& comm, const T* in_values, int n, T* out_values,
 | |
|             Op op, mpl::false_ /*is_mpi_op*/, mpl::true_ /*is_mpi_datatype*/)
 | |
|   {
 | |
|     user_op<Op, T> mpi_op(op);
 | |
|     BOOST_MPI_CHECK_RESULT(MPI_Scan,
 | |
|                            (const_cast<T*>(in_values), out_values, n,
 | |
|                             boost::mpi::get_mpi_datatype<T>(*in_values),
 | |
|                             mpi_op.get_mpi_op(), comm));
 | |
|   }
 | |
| 
 | |
|   /**********************************************************************
 | |
|    * User-defined, tree-based reduction for non-MPI data types          *
 | |
|    **********************************************************************/
 | |
| 
 | |
|   template<typename T, typename Op>
 | |
|   void
 | |
|   upper_lower_scan(const communicator& comm, const T* in_values, int n,
 | |
|                    T* out_values, Op& op, int lower, int upper)
 | |
|   {
 | |
|     int tag = environment::collectives_tag();
 | |
|     int rank = comm.rank();
 | |
| 
 | |
|     if (lower + 1 == upper) {
 | |
|       std::copy(in_values, in_values + n, out_values);
 | |
|     } else {
 | |
|       int middle = (lower + upper) / 2;
 | |
|       
 | |
|       if (rank < middle) {
 | |
|         // Lower half
 | |
|         upper_lower_scan(comm, in_values, n, out_values, op, lower, middle);
 | |
| 
 | |
|         // If we're the last process in the lower half, send our values
 | |
|         // to everyone in the upper half.
 | |
|         if (rank == middle - 1) {
 | |
|           packed_oarchive oa(comm);
 | |
|           for (int i = 0; i < n; ++i)
 | |
|             oa << out_values[i];
 | |
| 
 | |
|           for (int p = middle; p < upper; ++p)
 | |
|             comm.send(p, tag, oa);
 | |
|         }
 | |
|       } else {
 | |
|         // Upper half
 | |
|         upper_lower_scan(comm, in_values, n, out_values, op, middle, upper);
 | |
| 
 | |
|         // Receive value from the last process in the lower half.
 | |
|         packed_iarchive ia(comm);
 | |
|         comm.recv(middle - 1, tag, ia);
 | |
| 
 | |
|         // Combine value that came from the left with our value
 | |
|         T left_value;
 | |
|         for (int i = 0; i < n; ++i)
 | |
|           {
 | |
|             ia >> left_value;
 | |
|             out_values[i] = op(left_value, out_values[i]);
 | |
|           }
 | |
|       }
 | |
|     }
 | |
|   }
 | |
| 
 | |
|   // We are performing prefix reduction for a type that has no
 | |
|   // associated MPI datatype and operation, so we'll use a simple
 | |
|   // upper/lower algorithm.
 | |
|   template<typename T, typename Op>
 | |
|   inline void
 | |
|   scan_impl(const communicator& comm, const T* in_values, int n, T* out_values, 
 | |
|             Op op, mpl::false_ /*is_mpi_op*/, mpl::false_/*is_mpi_datatype*/)
 | |
|   {
 | |
|     upper_lower_scan(comm, in_values, n, out_values, op, 0, comm.size());
 | |
|   }
 | |
| } // end namespace detail
 | |
| 
 | |
| 
 | |
| template<typename T, typename Op>
 | |
| inline void
 | |
| scan(const communicator& comm, const T& in_value, T& out_value, Op op)
 | |
| {
 | |
|   detail::scan_impl(comm, &in_value, 1, &out_value, op, 
 | |
|                     is_mpi_op<Op, T>(), is_mpi_datatype<T>());
 | |
| }
 | |
| 
 | |
| template<typename T, typename Op>
 | |
| inline void
 | |
| scan(const communicator& comm, const T* in_values, int n, T* out_values, Op op)
 | |
| {
 | |
|   detail::scan_impl(comm, in_values, n, out_values, op, 
 | |
|                     is_mpi_op<Op, T>(), is_mpi_datatype<T>());
 | |
| }
 | |
| 
 | |
| template<typename T, typename Op>
 | |
| inline T
 | |
| scan(const communicator& comm, const T& in_value, Op op)
 | |
| {
 | |
|   T out_value;
 | |
|   detail::scan_impl(comm, &in_value, 1, &out_value, op, 
 | |
|                     is_mpi_op<Op, T>(), is_mpi_datatype<T>());
 | |
|   return out_value;
 | |
| }
 | |
| 
 | |
| } } // end namespace boost::mpi
 | |
| 
 | |
| #endif // BOOST_MPI_SCAN_HPP
 | 
