#ifndef __COMMUNICATOR_HPP__
#define __COMMUNICATOR_HPP__

#include <mpi.h>
#include <algorithm>
#include <cassert>
#include <complex>
#include <cstdint>
#include <cstdio>
#include <map>
#include <memory>
#include <string>
#include <vector>
#define CALL_MPI(func__, args__)                                                              \
{                                                                                             \
    if (func__ args__ != MPI_SUCCESS) {                                                       \
        std::printf("error in %s at line %i of file %s\n", #func__, __LINE__, __FILE__);      \
        MPI_Abort(MPI_COMM_WORLD, -1);                                                        \
    }                                                                                         \
}
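/* Usage sketch (illustrative): the macro takes the MPI function name and its parenthesized
   argument list as two separate macro arguments, so a checked barrier call is written as

       CALL_MPI(MPI_Barrier, (MPI_COMM_WORLD));

   which prints a diagnostic and aborts if the call does not return MPI_SUCCESS. */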
/// Type of MPI reduction.
enum class op_t { sum, max, min, land };

template <op_t op__>
struct op_wrapper;

template <>
struct op_wrapper<op_t::sum> {
    operator MPI_Op() const noexcept { return MPI_SUM; }
};

template <>
struct op_wrapper<op_t::max> {
    operator MPI_Op() const noexcept { return MPI_MAX; }
};

template <>
struct op_wrapper<op_t::min> {
    operator MPI_Op() const noexcept { return MPI_MIN; }
};

template <>
struct op_wrapper<op_t::land> {
    operator MPI_Op() const noexcept { return MPI_LAND; }
};
/// Map a C++ type to the corresponding MPI data type.
template <typename T>
struct type_wrapper;

template <>
struct type_wrapper<float> {
    operator MPI_Datatype() const noexcept { return MPI_FLOAT; }
};

template <>
struct type_wrapper<std::complex<float>> {
    operator MPI_Datatype() const noexcept { return MPI_C_FLOAT_COMPLEX; }
};

template <>
struct type_wrapper<double> {
    operator MPI_Datatype() const noexcept { return MPI_DOUBLE; }
};

template <>
struct type_wrapper<std::complex<double>> {
    operator MPI_Datatype() const noexcept { return MPI_C_DOUBLE_COMPLEX; }
};

template <>
struct type_wrapper<long double> {
    operator MPI_Datatype() const noexcept { return MPI_LONG_DOUBLE; }
};

template <>
struct type_wrapper<int> {
    operator MPI_Datatype() const noexcept { return MPI_INT; }
};

template <>
struct type_wrapper<short> {
    operator MPI_Datatype() const noexcept { return MPI_SHORT; }
};

template <>
struct type_wrapper<char> {
    operator MPI_Datatype() const noexcept { return MPI_CHAR; }
};

template <>
struct type_wrapper<unsigned char> {
    operator MPI_Datatype() const noexcept { return MPI_UNSIGNED_CHAR; }
};

template <>
struct type_wrapper<unsigned long long> {
    operator MPI_Datatype() const noexcept { return MPI_UNSIGNED_LONG_LONG; }
};

template <>
struct type_wrapper<unsigned long> {
    operator MPI_Datatype() const noexcept { return MPI_UNSIGNED_LONG; }
};

template <>
struct type_wrapper<bool> {
    operator MPI_Datatype() const noexcept { return MPI_C_BOOL; }
};

template <>
struct type_wrapper<uint32_t> {
    operator MPI_Datatype() const noexcept { return MPI_UINT32_T; }
};
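/* Usage sketch (illustrative): the wrappers convert implicitly to MPI_Datatype and MPI_Op,
   so the MPI type and reduction operation can be selected from template parameters, e.g.

       std::vector<double> x(100, 1.0);
       CALL_MPI(MPI_Allreduce, (MPI_IN_PLACE, x.data(), static_cast<int>(x.size()),
                                type_wrapper<double>(), op_wrapper<op_t::sum>(), MPI_COMM_WORLD));
*/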
/// Descriptor of block-distributed data: per-rank counts and offsets.
struct block_data_descriptor
{
    int num_ranks{-1};
    std::vector<int> counts;
    std::vector<int> offsets;

    block_data_descriptor(int num_ranks__)
        : num_ranks(num_ranks__)
    {
        counts  = std::vector<int>(num_ranks, 0);
        offsets = std::vector<int>(num_ranks, 0);
    }

    /// Compute offsets as the cumulative sum of counts.
    void calc_offsets()
    {
        for (int i = 1; i < num_ranks; i++) {
            offsets[i] = offsets[i - 1] + counts[i - 1];
        }
    }

    /// Total size of the described data (valid after calc_offsets()).
    inline int size() const { return counts.back() + offsets.back(); }
};
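/* Usage sketch (illustrative; "comm" stands for any communicator instance): describe a
   distribution with 10 elements per rank and query the global size.

       block_data_descriptor bd(comm.size());
       std::fill(bd.counts.begin(), bd.counts.end(), 10);
       bd.calc_offsets();          // offsets[i] becomes the sum of counts[0..i-1]
       int ntot = bd.size();       // == 10 * comm.size()
*/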
/// Wrapper around a non-blocking MPI request.
class Request
{
  private:
    MPI_Request handler_;

  public:
    void wait() { CALL_MPI(MPI_Wait, (&handler_, MPI_STATUS_IGNORE)); }

    MPI_Request& handler() { return handler_; }
};
/// Deleter used by the smart pointer that owns an allocated MPI communicator.
struct mpi_comm_deleter
{
    void operator()(MPI_Comm* comm__) const
    {
        int mpi_finalized_flag;
        MPI_Finalized(&mpi_finalized_flag);
        if (!mpi_finalized_flag) {
            CALL_MPI(MPI_Comm_free, (comm__));
        }
        delete comm__;
    }
};
    /// MPI initialization.
    static void initialize(int required__)
    {
        int provided;

        MPI_Init_thread(NULL, NULL, required__, &provided);
        MPI_Query_thread(&provided);
        if ((provided < required__) && (Communicator::world().rank() == 0)) {
            std::printf("Warning! Required level of thread support is not provided.\n");
            std::printf("provided: %d \nrequired: %d\n", provided, required__);
        }
    }
    /// True if MPI has already been finalized.
    static bool is_finalized()
    {
        int mpi_finalized_flag;
        MPI_Finalized(&mpi_finalized_flag);
        return mpi_finalized_flag == true;
    }
    void abort(int errcode__) const
    {
        CALL_MPI(MPI_Abort, (this->native(), errcode__));
    }
    inline Communicator cart_create(int ndims__, int const* dims__, int const* periods__) const
    {
        auto comm_sptr = std::shared_ptr<MPI_Comm>(new MPI_Comm, mpi_comm_deleter());
        CALL_MPI(MPI_Cart_create, (this->native(), ndims__, dims__, periods__, 0, comm_sptr.get()));
        return Communicator(comm_sptr);
    }
    inline Communicator cart_sub(int const* remain_dims__) const
    {
        auto comm_sptr = std::shared_ptr<MPI_Comm>(new MPI_Comm, mpi_comm_deleter());
        CALL_MPI(MPI_Cart_sub, (this->native(), remain_dims__, comm_sptr.get()));
        return Communicator(comm_sptr);
    }
    inline Communicator split(int color__) const
    {
        auto comm_sptr = std::shared_ptr<MPI_Comm>(new MPI_Comm, mpi_comm_deleter());
        CALL_MPI(MPI_Comm_split, (this->native(), color__, rank(), comm_sptr.get()));
        return Communicator(comm_sptr);
    }
    inline Communicator duplicate() const
    {
        auto comm_sptr = std::shared_ptr<MPI_Comm>(new MPI_Comm, mpi_comm_deleter());
        CALL_MPI(MPI_Comm_dup, (this->native(), comm_sptr.get()));
        return Communicator(comm_sptr);
    }
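    /* Usage sketch (illustrative; "nrow" is a hypothetical block size): group each block of
       nrow consecutive ranks into its own sub-communicator by splitting on a common color.

           auto row_comm = comm.split(comm.rank() / nrow);
    */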
    /// Mapping between Fortran and SIRIUS MPI communicators.
    static Communicator const& map_fcomm(int fcomm__)
    {
        static std::map<int, Communicator> fcomm_map;
        if (!fcomm_map.count(fcomm__)) {
            fcomm_map[fcomm__] = Communicator(MPI_Comm_f2c(fcomm__));
        }
        auto& comm = fcomm_map[fcomm__];
        return comm;
    }
    /// Pack a pair of indices into a single MPI tag; the shift leaves the low bits free.
    static int get_tag(int i__, int j__)
    {
        return (j__ * (j__ + 1) / 2 + i__ + 1) << 6;
    }
    static std::string processor_name()
    {
        char name[MPI_MAX_PROCESSOR_NAME];
        int len;
        CALL_MPI(MPI_Get_processor_name, (name, &len));
        return std::string(name, len);
    }
    /// Rank of MPI process inside communicator with associated Cartesian partitioning.
    inline int cart_rank(std::vector<int> const& coords__) const
    {
        if (this->native() == MPI_COMM_SELF) {
            return 0;
        }
        int r;
        CALL_MPI(MPI_Cart_rank, (this->native(), &coords__[0], &r));
        return r;
    }
    inline bool is_null() const
    {
        return (mpi_comm_raw_ == MPI_COMM_NULL);
    }
    inline void barrier() const
    {
#if defined(__PROFILE_MPI)
        PROFILE("MPI_Barrier");
#endif
        assert(this->native() != MPI_COMM_NULL);
        CALL_MPI(MPI_Barrier, (this->native()));
    }
    /// Perform the in-place reduction to the root rank.
    template <typename T, op_t mpi_op__ = op_t::sum>
    inline void reduce(T* buffer__, int count__, int root__) const
    {
        if (root__ == rank()) {
            CALL_MPI(MPI_Reduce, (MPI_IN_PLACE, buffer__, count__, type_wrapper<T>(),
                                  op_wrapper<mpi_op__>(), root__, this->native()));
        } else {
            CALL_MPI(MPI_Reduce, (buffer__, NULL, count__, type_wrapper<T>(),
                                  op_wrapper<mpi_op__>(), root__, this->native()));
        }
    }
    /// Perform the in-place reduction to the root rank (non-blocking).
    template <typename T, op_t mpi_op__ = op_t::sum>
    inline void reduce(T* buffer__, int count__, int root__, MPI_Request* req__) const
    {
        if (root__ == rank()) {
            CALL_MPI(MPI_Ireduce, (MPI_IN_PLACE, buffer__, count__, type_wrapper<T>(),
                                   op_wrapper<mpi_op__>(), root__, this->native(), req__));
        } else {
            CALL_MPI(MPI_Ireduce, (buffer__, NULL, count__, type_wrapper<T>(),
                                   op_wrapper<mpi_op__>(), root__, this->native(), req__));
        }
    }
    /// Perform the out-of-place reduction to the root rank.
    template <typename T, op_t mpi_op__ = op_t::sum>
    void reduce(T const* sendbuf__, T* recvbuf__, int count__, int root__) const
    {
        CALL_MPI(MPI_Reduce, (sendbuf__, recvbuf__, count__, type_wrapper<T>(),
                              op_wrapper<mpi_op__>(), root__, this->native()));
    }
    /// Perform the out-of-place reduction to the root rank (non-blocking).
    template <typename T, op_t mpi_op__ = op_t::sum>
    void reduce(T const* sendbuf__, T* recvbuf__, int count__, int root__, MPI_Request* req__) const
    {
        CALL_MPI(MPI_Ireduce, (sendbuf__, recvbuf__, count__, type_wrapper<T>(),
                               op_wrapper<mpi_op__>(), root__, this->native(), req__));
    }
    /// Perform the in-place (the output buffer is used as the input buffer) all-to-all reduction.
    template <typename T, op_t mpi_op__ = op_t::sum>
    inline void allreduce(T* buffer__, int count__) const
    {
        CALL_MPI(MPI_Allreduce, (MPI_IN_PLACE, buffer__, count__, type_wrapper<T>(),
                                 op_wrapper<mpi_op__>(), this->native()));
    }
    /// Perform the in-place all-to-all reduction on the whole vector.
    template <typename T, op_t op__ = op_t::sum>
    inline void allreduce(std::vector<T>& buffer__) const
    {
        allreduce<T, op__>(buffer__.data(), static_cast<int>(buffer__.size()));
    }
    /// Non-blocking in-place all-to-all reduction.
    template <typename T, op_t mpi_op__ = op_t::sum>
    inline void iallreduce(T* buffer__, int count__, MPI_Request* req__) const
    {
#if defined(__PROFILE_MPI)
        PROFILE("MPI_Iallreduce");
#endif
        CALL_MPI(MPI_Iallreduce, (MPI_IN_PLACE, buffer__, count__, type_wrapper<T>(),
                                  op_wrapper<mpi_op__>(), this->native(), req__));
    }
    /// Perform buffer broadcast.
    template <typename T>
    inline void bcast(T* buffer__, int count__, int root__) const
    {
#if defined(__PROFILE_MPI)
        PROFILE("MPI_Bcast");
#endif
        CALL_MPI(MPI_Bcast, (buffer__, count__, type_wrapper<T>(), root__, this->native()));
    }
    /// Broadcast a string from the root rank.
    inline void bcast(std::string& str__, int root__) const
    {
        int sz;
        if (rank() == root__) {
            sz = static_cast<int>(str__.size());
        }
        bcast(&sz, 1, root__);
        char* buf = new char[sz + 1];
        if (rank() == root__) {
            std::copy(str__.c_str(), str__.c_str() + sz + 1, buf);
        }
        bcast(buf, sz + 1, root__);
        str__ = std::string(buf);
        delete[] buf;
    }
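    /* Usage sketch (illustrative): broadcast a string chosen on rank 0 to all other ranks.

           std::string fname;
           if (comm.rank() == 0) {
               fname = "input.json";
           }
           comm.bcast(fname, 0);
    */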
    /// In-place MPI_Allgatherv.
    template <typename T>
    void allgather(T* buffer__, int const* recvcounts__, int const* displs__) const
    {
#if defined(__PROFILE_MPI)
        PROFILE("MPI_Allgatherv");
#endif
        CALL_MPI(MPI_Allgatherv, (MPI_IN_PLACE, 0, MPI_DATATYPE_NULL, buffer__, recvcounts__, displs__,
                                  type_wrapper<T>(), this->native()));
    }
    /// Out-of-place MPI_Allgatherv.
    template <typename T>
    void allgather(T const* sendbuf__, int sendcount__, T* recvbuf__, int const* recvcounts__,
                   int const* displs__) const
    {
#if defined(__PROFILE_MPI)
        PROFILE("MPI_Allgatherv");
#endif
        CALL_MPI(MPI_Allgatherv, (sendbuf__, sendcount__, type_wrapper<T>(), recvbuf__, recvcounts__,
                                  displs__, type_wrapper<T>(), this->native()));
    }
    /// Out-of-place MPI_Allgatherv; per-rank counts and displacements are exchanged first.
    template <typename T>
    void allgather(T const* sendbuf__, T* recvbuf__, int count__, int displs__) const
    {
        std::vector<int> v(size() * 2);
        v[2 * rank()]     = count__;
        v[2 * rank() + 1] = displs__;

        CALL_MPI(MPI_Allgather,
                 (MPI_IN_PLACE, 0, MPI_DATATYPE_NULL, v.data(), 2, type_wrapper<int>(), this->native()));

        std::vector<int> counts(size());
        std::vector<int> displs(size());
        for (int i = 0; i < size(); i++) {
            counts[i] = v[2 * i];
            displs[i] = v[2 * i + 1];
        }

        CALL_MPI(MPI_Allgatherv, (sendbuf__, count__, type_wrapper<T>(), recvbuf__, counts.data(),
                                  displs.data(), type_wrapper<T>(), this->native()));
    }
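    /* Usage sketch (illustrative; "nloc", "offset" and "ntot" are hypothetical per-rank block
       size, global offset and total size): each rank passes only its local chunk; the counts
       and displacements of all ranks are collected internally before MPI_Allgatherv.

           std::vector<double> local(nloc), global(ntot);
           comm.allgather(local.data(), global.data(), nloc, offset);
    */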
    /// In-place MPI_Allgatherv.
    template <typename T>
    void allgather(T* buffer__, int count__, int displs__) const
    {
        std::vector<int> v(size() * 2);
        v[2 * rank()]     = count__;
        v[2 * rank() + 1] = displs__;

        CALL_MPI(MPI_Allgather,
                 (MPI_IN_PLACE, 0, MPI_DATATYPE_NULL, v.data(), 2, type_wrapper<int>(), this->native()));

        std::vector<int> counts(size());
        std::vector<int> displs(size());
        for (int i = 0; i < size(); i++) {
            counts[i] = v[2 * i];
            displs[i] = v[2 * i + 1];
        }

        allgather(buffer__, counts.data(), displs.data());
    }
    template <typename T>
    void send(T const* buffer__, int count__, int dest__, int tag__) const
    {
#if defined(__PROFILE_MPI)
        PROFILE("MPI_Send");
#endif
        CALL_MPI(MPI_Send, (buffer__, count__, type_wrapper<T>(), dest__, tag__, this->native()));
    }
    template <typename T>
    Request isend(T const* buffer__, int count__, int dest__, int tag__) const
    {
        Request req;
#if defined(__PROFILE_MPI)
        PROFILE("MPI_Isend");
#endif
        CALL_MPI(MPI_Isend, (buffer__, count__, type_wrapper<T>(), dest__, tag__, this->native(),
                             &req.handler()));
        return req;
    }
    template <typename T>
    void recv(T* buffer__, int count__, int source__, int tag__) const
    {
#if defined(__PROFILE_MPI)
        PROFILE("MPI_Recv");
#endif
        CALL_MPI(MPI_Recv,
                 (buffer__, count__, type_wrapper<T>(), source__, tag__, this->native(), MPI_STATUS_IGNORE));
    }
    template <typename T>
    Request irecv(T* buffer__, int count__, int source__, int tag__) const
    {
        Request req;
#if defined(__PROFILE_MPI)
        PROFILE("MPI_Irecv");
#endif
        CALL_MPI(MPI_Irecv, (buffer__, count__, type_wrapper<T>(), source__, tag__, this->native(),
                             &req.handler()));
        return req;
    }
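    /* Usage sketch (illustrative): non-blocking ring exchange using the Request objects
       returned by isend()/irecv().

           int n = 16;
           std::vector<int> out(n, comm.rank()), in(n);
           auto sreq = comm.isend(out.data(), n, (comm.rank() + 1) % comm.size(), 0);
           auto rreq = comm.irecv(in.data(), n, (comm.rank() + comm.size() - 1) % comm.size(), 0);
           sreq.wait();
           rreq.wait();
    */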
    /// Gather data on a given rank.
    template <typename T>
    void gather(T const* sendbuf__, T* recvbuf__, int const* recvcounts__, int const* displs__,
                int root__) const
    {
        int sendcount = recvcounts__[rank()];
#if defined(__PROFILE_MPI)
        PROFILE("MPI_Gatherv");
#endif
        CALL_MPI(MPI_Gatherv, (sendbuf__, sendcount, type_wrapper<T>(), recvbuf__, recvcounts__, displs__,
                               type_wrapper<T>(), root__, this->native()));
    }
    /// Gather data on a given rank; per-rank counts and offsets are exchanged first.
    template <typename T>
    void gather(T const* sendbuf__, T* recvbuf__, int offset__, int count__, int root__) const
    {
#if defined(__PROFILE_MPI)
        PROFILE("MPI_Gatherv");
#endif
        std::vector<int> v(size() * 2);
        v[2 * rank()]     = count__;
        v[2 * rank() + 1] = offset__;

        CALL_MPI(MPI_Allgather,
                 (MPI_IN_PLACE, 0, MPI_DATATYPE_NULL, v.data(), 2, type_wrapper<int>(), this->native()));

        std::vector<int> counts(size());
        std::vector<int> offsets(size());
        for (int i = 0; i < size(); i++) {
            counts[i]  = v[2 * i];
            offsets[i] = v[2 * i + 1];
        }

        CALL_MPI(MPI_Gatherv, (sendbuf__, count__, type_wrapper<T>(), recvbuf__, counts.data(),
                               offsets.data(), type_wrapper<T>(), root__, this->native()));
    }
    /// Scatter data from a given rank.
    template <typename T>
    void scatter(T const* sendbuf__, T* recvbuf__, int const* sendcounts__, int const* displs__,
                 int root__) const
    {
#if defined(__PROFILE_MPI)
        PROFILE("MPI_Scatterv");
#endif
        int recvcount = sendcounts__[rank()];
        CALL_MPI(MPI_Scatterv, (sendbuf__, sendcounts__, displs__, type_wrapper<T>(), recvbuf__, recvcount,
                                type_wrapper<T>(), root__, this->native()));
    }
    template <typename T>
    void alltoall(T const* sendbuf__, int sendcounts__, T* recvbuf__, int recvcounts__) const
    {
#if defined(__PROFILE_MPI)
        PROFILE("MPI_Alltoall");
#endif
        CALL_MPI(MPI_Alltoall, (sendbuf__, sendcounts__, type_wrapper<T>(), recvbuf__, recvcounts__,
                                type_wrapper<T>(), this->native()));
    }
    template <typename T>
    void alltoall(T const* sendbuf__, int const* sendcounts__, int const* sdispls__, T* recvbuf__,
                  int const* recvcounts__, int const* rdispls__) const
    {
#if defined(__PROFILE_MPI)
        PROFILE("MPI_Alltoallv");
#endif
        CALL_MPI(MPI_Alltoallv, (sendbuf__, sendcounts__, sdispls__, type_wrapper<T>(), recvbuf__,
                                 recvcounts__, rdispls__, type_wrapper<T>(), this->native()));
    }
Member summary:

Communicator
    MPI communicator wrapper.
Communicator()
    Default constructor.
Communicator(MPI_Comm mpi_comm__)
    Constructor for existing communicator.
Communicator(std::shared_ptr<MPI_Comm> comm__)
    Constructor for new communicator.
MPI_Comm mpi_comm_raw_
    Raw MPI communicator.
std::shared_ptr<MPI_Comm> mpi_comm_
    Smart pointer to allocated MPI communicator.
int rank_
    Store communicator's rank.
int size_
    Store communicator's size.
MPI_Comm native() const
    Return the native raw MPI communicator handle.
int rank() const
    Rank of MPI process inside communicator.
int size() const
    Size of the communicator (number of ranks).
int cart_rank(std::vector<int> const& coords__) const
    Rank of MPI process inside communicator with associated Cartesian partitioning.
static void initialize(int required__)
    MPI initialization.
static void finalize()
    MPI shutdown.
static Communicator const& map_fcomm(int fcomm__)
    Mapping between Fortran and SIRIUS MPI communicators.
void bcast(T* buffer__, int count__, int root__) const
    Perform buffer broadcast.
void allreduce(T* buffer__, int count__) const
    Perform the in-place (the output buffer is used as the input buffer) all-to-all reduction.
void allreduce(std::vector<T>& buffer__) const
    Perform the in-place (the output buffer is used as the input buffer) all-to-all reduction.
void allgather(T* buffer__, int const* recvcounts__, int const* displs__) const
    In-place MPI_Allgatherv.
void allgather(T* buffer__, int count__, int displs__) const
    In-place MPI_Allgatherv.
void allgather(T const* sendbuf__, int sendcount__, T* recvbuf__, int const* recvcounts__, int const* displs__) const
    Out-of-place MPI_Allgatherv.
void gather(T const* sendbuf__, T* recvbuf__, int offset__, int count__, int root__) const
    Gather data on a given rank.
op_t
    Type of MPI reduction.
void copy(T* target__, T const* source__, size_t n__)
    Copy memory inside a device.
int get_device_id(int num_devices__)
    Get GPU device id associated with the current rank.
int num_ranks_per_node()
    Get number of ranks per node.
Namespace of the SIRIUS library.
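A minimal usage sketch (not part of the header) is shown below; it assumes the header is
available as "communicator.hpp" and that the Communicator class lives in the sirius namespace.

#include <cstdio>
#include <vector>
#include "communicator.hpp"

int main()
{
    // request thread support and set up MPI (MPI_THREAD_FUNNELED is a standard MPI constant)
    sirius::Communicator::initialize(MPI_THREAD_FUNNELED);
    {
        auto const& comm = sirius::Communicator::world();

        // each rank contributes a vector of ones; the in-place allreduce sums them element-wise
        std::vector<double> x(4, 1.0);
        comm.allreduce(x.data(), static_cast<int>(x.size()));

        if (comm.rank() == 0) {
            std::printf("x[0] = %f on %i ranks\n", x[0], comm.size());
        }
    }
    sirius::Communicator::finalize();
    return 0;
}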