169 lines
5.9 KiB
C++
169 lines
5.9 KiB
C++
|
// Copyright (C) 2005-2006 Douglas Gregor <doug.gregor@gmail.com>.
|
||
|
// Copyright (C) 2004 The Trustees of Indiana University
|
||
|
|
||
|
// Use, modification and distribution is subject to the Boost Software
|
||
|
// License, Version 1.0. (See accompanying file LICENSE_1_0.txt or copy at
|
||
|
// http://www.boost.org/LICENSE_1_0.txt)
|
||
|
|
||
|
// Authors: Douglas Gregor
|
||
|
// Andrew Lumsdaine
|
||
|
|
||
|
// Message Passing Interface 1.1 -- Section 4.9.1. Scan
|
||
|
#ifndef BOOST_MPI_SCAN_HPP
|
||
|
#define BOOST_MPI_SCAN_HPP
|
||
|
|
||
|
#include <boost/mpi/exception.hpp>
|
||
|
#include <boost/mpi/datatype.hpp>
|
||
|
|
||
|
// For (de-)serializing sends and receives
|
||
|
#include <boost/mpi/packed_oarchive.hpp>
|
||
|
#include <boost/mpi/packed_iarchive.hpp>
|
||
|
|
||
|
// For packed_[io]archive sends and receives
|
||
|
#include <boost/mpi/detail/point_to_point.hpp>
|
||
|
|
||
|
#include <boost/mpi/communicator.hpp>
|
||
|
#include <boost/mpi/environment.hpp>
|
||
|
#include <boost/mpi/detail/computation_tree.hpp>
|
||
|
#include <boost/mpi/operations.hpp>
|
||
|
#include <algorithm>
|
||
|
#include <exception>
|
||
|
#include <boost/assert.hpp>
|
||
|
|
||
|
namespace boost { namespace mpi {
|
||
|
|
||
|
|
||
|
/************************************************************************
|
||
|
* Implementation details *
|
||
|
************************************************************************/
|
||
|
namespace detail {
|
||
|
/**********************************************************************
|
||
|
* Simple prefix reduction with MPI_Scan *
|
||
|
**********************************************************************/
|
||
|
|
||
|
// We are performing prefix reduction for a type that has an
|
||
|
// associated MPI datatype and operation, so we'll use MPI_Scan
|
||
|
// directly.
|
||
|
template<typename T, typename Op>
|
||
|
void
|
||
|
scan_impl(const communicator& comm, const T* in_values, int n, T* out_values,
|
||
|
Op /*op*/, mpl::true_ /*is_mpi_op*/, mpl::true_ /*is_mpi_datatype*/)
|
||
|
{
|
||
|
BOOST_MPI_CHECK_RESULT(MPI_Scan,
|
||
|
(const_cast<T*>(in_values), out_values, n,
|
||
|
boost::mpi::get_mpi_datatype<T>(*in_values),
|
||
|
(is_mpi_op<Op, T>::op()), comm));
|
||
|
}
|
||
|
|
||
|
/**********************************************************************
|
||
|
* User-defined prefix reduction with MPI_Scan *
|
||
|
**********************************************************************/
|
||
|
|
||
|
// We are performing prefix reduction for a type that has an
|
||
|
// associated MPI datatype but with a custom operation. We'll use
|
||
|
// MPI_Scan directly, but we'll need to create an MPI_Op manually.
|
||
|
template<typename T, typename Op>
|
||
|
void
|
||
|
scan_impl(const communicator& comm, const T* in_values, int n, T* out_values,
|
||
|
Op op, mpl::false_ /*is_mpi_op*/, mpl::true_ /*is_mpi_datatype*/)
|
||
|
{
|
||
|
user_op<Op, T> mpi_op(op);
|
||
|
BOOST_MPI_CHECK_RESULT(MPI_Scan,
|
||
|
(const_cast<T*>(in_values), out_values, n,
|
||
|
boost::mpi::get_mpi_datatype<T>(*in_values),
|
||
|
mpi_op.get_mpi_op(), comm));
|
||
|
}
|
||
|
|
||
|
/**********************************************************************
|
||
|
* User-defined, tree-based reduction for non-MPI data types *
|
||
|
**********************************************************************/
|
||
|
|
||
|
template<typename T, typename Op>
|
||
|
void
|
||
|
upper_lower_scan(const communicator& comm, const T* in_values, int n,
|
||
|
T* out_values, Op& op, int lower, int upper)
|
||
|
{
|
||
|
int tag = environment::collectives_tag();
|
||
|
int rank = comm.rank();
|
||
|
|
||
|
if (lower + 1 == upper) {
|
||
|
std::copy(in_values, in_values + n, out_values);
|
||
|
} else {
|
||
|
int middle = (lower + upper) / 2;
|
||
|
|
||
|
if (rank < middle) {
|
||
|
// Lower half
|
||
|
upper_lower_scan(comm, in_values, n, out_values, op, lower, middle);
|
||
|
|
||
|
// If we're the last process in the lower half, send our values
|
||
|
// to everyone in the upper half.
|
||
|
if (rank == middle - 1) {
|
||
|
packed_oarchive oa(comm);
|
||
|
for (int i = 0; i < n; ++i)
|
||
|
oa << out_values[i];
|
||
|
|
||
|
for (int p = middle; p < upper; ++p)
|
||
|
comm.send(p, tag, oa);
|
||
|
}
|
||
|
} else {
|
||
|
// Upper half
|
||
|
upper_lower_scan(comm, in_values, n, out_values, op, middle, upper);
|
||
|
|
||
|
// Receive value from the last process in the lower half.
|
||
|
packed_iarchive ia(comm);
|
||
|
comm.recv(middle - 1, tag, ia);
|
||
|
|
||
|
// Combine value that came from the left with our value
|
||
|
T left_value;
|
||
|
for (int i = 0; i < n; ++i)
|
||
|
{
|
||
|
ia >> left_value;
|
||
|
out_values[i] = op(left_value, out_values[i]);
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// We are performing prefix reduction for a type that has no
|
||
|
// associated MPI datatype and operation, so we'll use a simple
|
||
|
// upper/lower algorithm.
|
||
|
template<typename T, typename Op>
|
||
|
inline void
|
||
|
scan_impl(const communicator& comm, const T* in_values, int n, T* out_values,
|
||
|
Op op, mpl::false_ /*is_mpi_op*/, mpl::false_/*is_mpi_datatype*/)
|
||
|
{
|
||
|
upper_lower_scan(comm, in_values, n, out_values, op, 0, comm.size());
|
||
|
}
|
||
|
} // end namespace detail
|
||
|
|
||
|
|
||
|
template<typename T, typename Op>
|
||
|
inline void
|
||
|
scan(const communicator& comm, const T& in_value, T& out_value, Op op)
|
||
|
{
|
||
|
detail::scan_impl(comm, &in_value, 1, &out_value, op,
|
||
|
is_mpi_op<Op, T>(), is_mpi_datatype<T>());
|
||
|
}
|
||
|
|
||
|
template<typename T, typename Op>
|
||
|
inline void
|
||
|
scan(const communicator& comm, const T* in_values, int n, T* out_values, Op op)
|
||
|
{
|
||
|
detail::scan_impl(comm, in_values, n, out_values, op,
|
||
|
is_mpi_op<Op, T>(), is_mpi_datatype<T>());
|
||
|
}
|
||
|
|
||
|
template<typename T, typename Op>
|
||
|
inline T
|
||
|
scan(const communicator& comm, const T& in_value, Op op)
|
||
|
{
|
||
|
T out_value;
|
||
|
detail::scan_impl(comm, &in_value, 1, &out_value, op,
|
||
|
is_mpi_op<Op, T>(), is_mpi_datatype<T>());
|
||
|
return out_value;
|
||
|
}
|
||
|
|
||
|
} } // end namespace boost::mpi
|
||
|
|
||
|
#endif // BOOST_MPI_SCAN_HPP
|