| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168 | // Copyright (C) 2005-2006 Douglas Gregor <doug.gregor@gmail.com>.// Copyright (C) 2004 The Trustees of Indiana University// Use, modification and distribution is subject to the Boost Software// License, Version 1.0. (See accompanying file LICENSE_1_0.txt or copy at// http://www.boost.org/LICENSE_1_0.txt)//   Authors: Douglas Gregor//            Andrew Lumsdaine// Message Passing Interface 1.1 -- Section 4.9.1. Scan#ifndef BOOST_MPI_SCAN_HPP#define BOOST_MPI_SCAN_HPP#include <boost/mpi/exception.hpp>#include <boost/mpi/datatype.hpp>// For (de-)serializing sends and receives#include <boost/mpi/packed_oarchive.hpp>#include <boost/mpi/packed_iarchive.hpp>// For packed_[io]archive sends and receives#include <boost/mpi/detail/point_to_point.hpp>#include <boost/mpi/communicator.hpp>#include <boost/mpi/environment.hpp>#include <boost/mpi/detail/computation_tree.hpp>#include <boost/mpi/operations.hpp>#include <algorithm>#include <exception>#include <boost/assert.hpp>namespace boost { namespace mpi {/************************************************************************ * Implementation details                                               * ************************************************************************/namespace detail {  /**********************************************************************   * Simple prefix reduction with MPI_Scan                              *   **********************************************************************/  // We are performing prefix reduction for a type that has an  // associated MPI datatype and operation, so we'll use MPI_Scan  // directly.  template<typename T, typename Op>  void  scan_impl(const communicator& comm, const T* in_values, int n, T* out_values,            Op /*op*/, mpl::true_ /*is_mpi_op*/, mpl::true_ /*is_mpi_datatype*/)  {    BOOST_MPI_CHECK_RESULT(MPI_Scan,                           (const_cast<T*>(in_values), out_values, n,                            boost::mpi::get_mpi_datatype<T>(*in_values),                            (is_mpi_op<Op, T>::op()), comm));  }  /**********************************************************************   * User-defined prefix reduction with MPI_Scan                        *   **********************************************************************/  // We are performing prefix reduction for a type that has an  // associated MPI datatype but with a custom operation. We'll use  // MPI_Scan directly, but we'll need to create an MPI_Op manually.  template<typename T, typename Op>  void  scan_impl(const communicator& comm, const T* in_values, int n, T* out_values,            Op op, mpl::false_ /*is_mpi_op*/, mpl::true_ /*is_mpi_datatype*/)  {    user_op<Op, T> mpi_op;    BOOST_MPI_CHECK_RESULT(MPI_Scan,                           (const_cast<T*>(in_values), out_values, n,                            boost::mpi::get_mpi_datatype<T>(*in_values),                            mpi_op.get_mpi_op(), comm));  }  /**********************************************************************   * User-defined, tree-based reduction for non-MPI data types          *   **********************************************************************/  template<typename T, typename Op>  void  upper_lower_scan(const communicator& comm, const T* in_values, int n,                   T* out_values, Op& op, int lower, int upper)  {    int tag = environment::collectives_tag();    int rank = comm.rank();    if (lower + 1 == upper) {      std::copy(in_values, in_values + n, out_values);    } else {      int middle = (lower + upper) / 2;            if (rank < middle) {        // Lower half        upper_lower_scan(comm, in_values, n, out_values, op, lower, middle);        // If we're the last process in the lower half, send our values        // to everyone in the upper half.        if (rank == middle - 1) {          packed_oarchive oa(comm);          for (int i = 0; i < n; ++i)            oa << out_values[i];          for (int p = middle; p < upper; ++p)            comm.send(p, tag, oa);        }      } else {        // Upper half        upper_lower_scan(comm, in_values, n, out_values, op, middle, upper);        // Receive value from the last process in the lower half.        packed_iarchive ia(comm);        comm.recv(middle - 1, tag, ia);        // Combine value that came from the left with our value        T left_value;        for (int i = 0; i < n; ++i)          {            ia >> left_value;            out_values[i] = op(left_value, out_values[i]);          }      }    }  }  // We are performing prefix reduction for a type that has no  // associated MPI datatype and operation, so we'll use a simple  // upper/lower algorithm.  template<typename T, typename Op>  inline void  scan_impl(const communicator& comm, const T* in_values, int n, T* out_values,             Op op, mpl::false_ /*is_mpi_op*/, mpl::false_/*is_mpi_datatype*/)  {    upper_lower_scan(comm, in_values, n, out_values, op, 0, comm.size());  }} // end namespace detailtemplate<typename T, typename Op>inline voidscan(const communicator& comm, const T& in_value, T& out_value, Op op){  detail::scan_impl(comm, &in_value, 1, &out_value, op,                     is_mpi_op<Op, T>(), is_mpi_datatype<T>());}template<typename T, typename Op>inline voidscan(const communicator& comm, const T* in_values, int n, T* out_values, Op op){  detail::scan_impl(comm, in_values, n, out_values, op,                     is_mpi_op<Op, T>(), is_mpi_datatype<T>());}template<typename T, typename Op>inline Tscan(const communicator& comm, const T& in_value, Op op){  T out_value;  detail::scan_impl(comm, &in_value, 1, &out_value, op,                     is_mpi_op<Op, T>(), is_mpi_datatype<T>());  return out_value;}} } // end namespace boost::mpi#endif // BOOST_MPI_SCAN_HPP
 |