doxygen/moose/RankMap_8C_source.html

 //* This file is part of the MOOSE framework
 //* https://mooseframework.inl.gov
 //*
 //* All rights reserved, see COPYRIGHT for full restrictions
 //* https://github.com/idaholab/moose/blob/master/COPYRIGHT
 //*
 //* Licensed under LGPL 2.1, please see LICENSE for details
 //* https://www.gnu.org/licenses/lgpl-2.1.html

 #include "RankMap.h"
 #include "PerfGraphInterface.h"

 #include "MooseApp.h"

 #include "libmesh/parallel.h"

 // Constructs the map: groups the ranks of the given communicator by the sub-communicator
 // obtained from an MPI_COMM_TYPE_SHARED split, numbers those groups contiguously from zero,
 // and records the result in _rank_to_hardware_id and _hardware_id_to_ranks.
 RankMap::RankMap(const Parallel::Communicator & comm, PerfGraph & perf_graph)
   : ParallelObject(comm), PerfGraphInterface(perf_graph, "RankMap")
 {
   TIME_SECTION("construct", 2, "Constructing RankMap");

   const auto n_ranks = n_processors();

   // Split the communicator by type MPI_COMM_TYPE_SHARED; node_comm receives our group
   Parallel::Communicator node_comm;
   _communicator.split_by_type(MPI_COMM_TYPE_SHARED, 0, MPI_INFO_NULL, node_comm);

   // Start with our own rank, then replace it with the value held by rank 0 of node_comm.
   // After the broadcast every member of a group holds the same value, which therefore
   // serves as a label for that group.
   processor_id_type group_root_rank = processor_id();
   node_comm.broadcast(group_root_rank, 0);

   // Gather every rank's group label so that entry i is the label of rank i
   std::vector<processor_id_type> root_of_rank(n_ranks);
   _communicator.allgather(group_root_rank, root_of_rank);

   // Group label -> hardware id, with ids handed out in order of first appearance
   std::map<unsigned int, unsigned int> root_to_hardware_id;
   unsigned int next_hardware_id = 0;

   _rank_to_hardware_id.resize(n_ranks);

   for (MooseIndex(root_of_rank) rank = 0; rank < root_of_rank.size(); ++rank)
   {
     const unsigned int group_root = root_of_rank[rank];

     // try_emplace inserts only when this label has not been seen yet; either way the
     // returned iterator points at the entry holding the id for this group
     const auto [entry, is_new] = root_to_hardware_id.try_emplace(group_root, next_hardware_id);
     if (is_new)
       ++next_hardware_id;

     const unsigned int hardware_id = entry->second;

     _rank_to_hardware_id[rank] = hardware_id;

     // operator[] creates the rank list for this id on first use
     _hardware_id_to_ranks[hardware_id].emplace_back(rank);
   }
 }
libMesh::Parallel::Communicator::allgather
void allgather(const T &send_data, std::vector< T, A > &recv_data) const

libMesh::Parallel::Communicator

RankMap::_rank_to_hardware_id
std::vector< unsigned int > _rank_to_hardware_id
Each entry corresponds to the hardware_id for that PID.
Definition: RankMap.h:63

RankMap.h

RankMap::_hardware_id_to_ranks
std::unordered_map< unsigned int, std::vector< processor_id_type > > _hardware_id_to_ranks
Map of hardware_id -> ranks on that node.
Definition: RankMap.h:60

libMesh::ParallelObject::_communicator
const Parallel::Communicator & _communicator

processor_id_type
uint8_t processor_id_type

libMesh::ParallelObject::n_processors
processor_id_type n_processors() const

MooseApp.h

PerfGraphInterface
Interface for objects interacting with the PerfGraph.
Definition: PerfGraphInterface.h:59

libMesh::Parallel::Communicator::broadcast
void broadcast(T &data, const unsigned int root_id=0, const bool identical_sizes=false) const

libMesh::Parallel::Communicator::split_by_type
void split_by_type(int split_type, int key, info i, Communicator &target) const

RankMap::RankMap
RankMap(const libMesh::Parallel::Communicator &comm, PerfGraph &perf_graph)
Constructs and fills the map.
Definition: RankMap.C:17

libMesh::ParallelObject::processor_id
processor_id_type processor_id() const

PerfGraph
The PerfGraph will hold the master list of all registered performance segments and the head PerfNode...
Definition: PerfGraph.h:43

PerfGraphInterface.h