CoreNEURON
partrans_setup.cpp
Go to the documentation of this file.
1 /*
2 # =============================================================================
3 # Copyright (c) 2016 - 2021 Blue Brain Project/EPFL
4 #
5 # See top-level LICENSE file for details.
6 # =============================================================================
7 */
8 
9 #include <map>
10 #include <vector>
11 
13 #include "coreneuron/nrnconf.h"
15 #include "coreneuron/mpi/nrnmpi.h"
19 
20 namespace coreneuron {
21 using namespace coreneuron::nrn_partrans;
22 
24 
25 class SidInfo {
26  public:
27  std::vector<int> tids_;
28  std::vector<int> indices_;
29 };
30 
31 } // namespace coreneuron
32 #if NRNLONGSGID
33 #define sgid_alltoallv nrnmpi_long_alltoallv
34 #else
35 #define sgid_alltoallv nrnmpi_int_alltoallv
36 #endif
37 
38 #define HAVEWANT_t sgid_t
39 #define HAVEWANT_alltoallv sgid_alltoallv
40 #define HAVEWANT2Int std::map<sgid_t, int>
42 
43 namespace coreneuron {
44 using namespace coreneuron::nrn_partrans;
45 
46 void nrn_partrans::gap_mpi_setup(int ngroup) {
47  // printf("%d gap_mpi_setup ngroup=%d\n", nrnmpi_myid, ngroup);
48 
49  // count total_nsrc, total_ntar and allocate.
50  // Possible either or both are 0 on this process.
51  size_t total_nsrc = 0, total_ntar = 0;
52  for (int tid = 0; tid < ngroup; ++tid) {
53  auto& si = setup_info_[tid];
54  total_nsrc += si.src_sid.size();
55  total_ntar += si.tar_sid.size();
56  }
57 
58  // have and want arrays (add 1 to guarantee new ... is an array.)
59  sgid_t* have = new sgid_t[total_nsrc + 1];
60  sgid_t* want = new sgid_t[total_ntar + 1];
61 
62  // map from source sid to (tid, index), ie. NrnThread[tid]._data[index].
63  // and target sid to lists of (tid, index) for memb_list
64  // also count the map sizes and fill have and want arrays
65  std::map<sgid_t, SidInfo> src2info;
66  std::map<sgid_t, SidInfo> tar2info;
67 
68  int src2info_size = 0, tar2info_size = 0; // number of unique sids
69  for (int tid = 0; tid < ngroup; ++tid) {
70  auto& si = setup_info_[tid];
71  // Sgid has unique source.
72 
73  for (size_t i = 0; i < si.src_sid.size(); ++i) {
74  sgid_t sid = si.src_sid[i];
75  SidInfo sidinfo;
76  sidinfo.tids_.push_back(tid);
77  sidinfo.indices_.push_back(i);
78  src2info[sid] = sidinfo;
79  have[src2info_size] = sid;
80  src2info_size++;
81  }
82  // Possibly many targets of same sid
83  // Only want unique sids. From each, can obtain all its targets.
84  for (size_t i = 0; i < si.tar_sid.size(); ++i) {
85  sgid_t sid = si.tar_sid[i];
86  if (tar2info.find(sid) == tar2info.end()) {
87  tar2info[sid] = SidInfo();
88  want[tar2info_size] = sid;
89  tar2info_size++;
90  }
91  SidInfo& sidinfo = tar2info[sid];
92  sidinfo.tids_.push_back(tid);
93  sidinfo.indices_.push_back(i);
94  }
95  }
96 
97  // 2) Call the have_to_want function.
98  sgid_t* send_to_want;
99  sgid_t* recv_from_have;
100 
101  have_to_want(have,
102  src2info_size,
103  want,
104  tar2info_size,
105  send_to_want,
106  outsrccnt_,
107  outsrcdspl_,
108  recv_from_have,
109  insrccnt_,
110  insrcdspl_,
112 
113  int nhost = nrnmpi_numprocs;
114 
115  // sanity check. all the sgids we are asked to send, we actually have
116  for (int i = 0; i < outsrcdspl_[nhost]; ++i) {
117  sgid_t sgid = send_to_want[i];
118  assert(src2info.find(sgid) != src2info.end());
119  }
120 
121  // sanity check. all the sgids we receive, we actually need.
122  for (int i = 0; i < insrcdspl_[nhost]; ++i) {
123  sgid_t sgid = recv_from_have[i];
124  assert(tar2info.find(sgid) != tar2info.end());
125  }
126 
127 #if CORENRN_DEBUG
128  printf("%d mpi outsrccnt_, outsrcdspl_, insrccnt, insrcdspl_\n", nrnmpi_myid);
129  for (int i = 0; i < nrnmpi_numprocs; ++i) {
130  printf("%d : %d %d %d %d\n",
131  nrnmpi_myid,
132  outsrccnt_[i],
133  outsrcdspl_[i],
134  insrccnt_[i],
135  insrcdspl_[i]);
136  }
137 #endif
138 
139  // clean up a little
140  delete[] have;
141  delete[] want;
142 
143  insrc_buf_ = new double[insrcdspl_[nhost]];
144  outsrc_buf_ = new double[outsrcdspl_[nhost]];
145 
146  // for i: src_gather[i] = NrnThread._data[src_indices[i]]
147  // for j: outsrc_buf[outsrc_indices[j]] = src_gather[gather2outsrc_indices[j]]
148  // src_indices point into NrnThread._data
149  // Many outsrc_indices elements can point to the same src_gather element
150  // but only if an sgid src datum is destined for multiple ranks.
151  for (int i = 0; i < outsrcdspl_[nhost]; ++i) {
152  sgid_t sgid = send_to_want[i];
153  SidInfo& sidinfo = src2info[sgid];
154  // only one item in the lists.
155  int tid = sidinfo.tids_[0];
156  int setup_info_index = sidinfo.indices_[0];
157 
158  auto& si = setup_info_[tid];
159  auto& ttd = transfer_thread_data_[tid];
160 
161  // Note that src_index points into NrnThread.data, as it has already
162  // been transformed using original src_type and src_index via
163  // stdindex2ptr.
164  // For copying into outsrc_buf from src_gather. This is from
165  // NrnThread._data, fixup to "from src_gather" below.
166  ttd.gather2outsrc_indices.push_back(si.src_index[setup_info_index]);
167  ttd.outsrc_indices.push_back(i);
168  }
169 
170  // Need to know src_gather index given NrnThread._data index
171  // to compute gather2outsrc_indices. And the update outsrc_indices so that
172  // for a given thread
173  // for j: outsrc_buf[outsrc_indices[j]] = src_gather[gather2outsrc_indices[j]]
174  for (int tid = 0; tid < ngroup; ++tid) {
175  auto& ttd = transfer_thread_data_[tid];
176  std::map<int, int> data2gather_indices;
177  for (size_t i = 0; i < ttd.src_indices.size(); ++i) {
178  data2gather_indices[ttd.src_indices[i]] = i;
179  }
180 
181  for (size_t i = 0; i < ttd.outsrc_indices.size(); ++i) {
182  ttd.gather2outsrc_indices[i] = data2gather_indices[ttd.gather2outsrc_indices[i]];
183  }
184  }
185 
186  // Which insrc_indices point into which NrnThread.data
187  // An sgid occurs at most once in the process recv_from_have.
188  // But it might get distributed to more than one thread and to
189  // several targets in a thread (specified by tar2info)
190  // insrc_indices is parallel to tar_indices and has size ntar of the thread.
191  // insrc_indices[i] is the index into insrc_buf
192  // tar_indices[i] is the index into NrnThread.data
193  // i.e. NrnThead._data[tar_indices[i]] = insrc_buf[insrc_indices[i]]
194  for (int i = 0; i < insrcdspl_[nhost]; ++i) {
195  sgid_t sgid = recv_from_have[i];
196  SidInfo& sidinfo = tar2info[sgid];
197  // there may be several items in the lists.
198  for (size_t j = 0; j < sidinfo.tids_.size(); ++j) {
199  int tid = sidinfo.tids_[j];
200  int index = sidinfo.indices_[j];
201 
202  transfer_thread_data_[tid].insrc_indices[index] = i;
203  }
204  }
205 
206 #if CORENRN_DEBUG
207  // things look ok so far?
208  for (int tid = 0; tid < ngroup; ++tid) {
209  SetupTransferInfo& si = setup_info_[tid];
211  for (size_t i = 0; i < si.src_sid.size(); ++i) {
212  printf("%d %d src sid=%d v_index=%d %g\n",
213  nrnmpi_myid,
214  tid,
215  si.src_sid[i],
216  ttd.src_indices[i],
217  nrn_threads[tid]._data[ttd.src_indices[i]]);
218  }
219  for (size_t i = 0; i < ttd.tar_indices.size(); ++i) {
220  printf("%d %d src sid=i%zd tar_index=%d %g\n",
221  nrnmpi_myid,
222  tid,
223  i,
224  ttd.tar_indices[i],
225  nrn_threads[tid]._data[ttd.tar_indices[i]]);
226  }
227  }
228 #endif
229 
230  delete[] send_to_want;
231  delete[] recv_from_have;
232 }
233 
234 /**
235  * For now, until conceptualization of the ordering is clear,
236  * just replace src setup_info_ indices values with stdindex2ptr determined
237  * index into NrnThread._data
238  **/
240  NrnThread& nt = *n;
241  auto& ttd = transfer_thread_data_[nt.id];
242  auto& sti = setup_info_[nt.id];
243 
244  ttd.src_gather.resize(sti.src_sid.size());
245  ttd.src_indices.resize(sti.src_sid.size());
246  ttd.insrc_indices.resize(sti.tar_sid.size());
247  ttd.tar_indices.resize(sti.tar_sid.size());
248 
249  // For copying into src_gather from NrnThread._data
250  for (size_t i = 0; i < sti.src_sid.size(); ++i) {
251  double* d = stdindex2ptr(sti.src_type[i], sti.src_index[i], nt);
252  sti.src_index[i] = int(d - nt._data);
253  }
254 
255  // For copying into NrnThread._data from insrc_buf.
256  for (size_t i = 0; i < sti.tar_sid.size(); ++i) {
257  double* d = stdindex2ptr(sti.tar_type[i], sti.tar_index[i], nt);
258  // todo : this should be revisited once nt._data will be broken
259  // into mechanism specific data
260  sti.tar_index[i] = int(d - nt._data);
261  }
262 
263  // Here we could reorder sti.src_... according to NrnThread._data index
264  // order
265 
266  // copy into TransferThreadData
267  ttd.src_indices = sti.src_index;
268  ttd.tar_indices = sti.tar_index;
269 }
270 
272  if (transfer_thread_data_) {
273  delete[] transfer_thread_data_;
274  transfer_thread_data_ = nullptr;
275  }
276  if (insrc_buf_) {
277  delete[] insrc_buf_;
278  insrc_buf_ = nullptr;
279  delete[] insrccnt_;
280  insrccnt_ = nullptr;
281  delete[] insrcdspl_;
282  insrcdspl_ = nullptr;
283  delete[] outsrc_buf_;
284  outsrc_buf_ = nullptr;
285  delete[] outsrccnt_;
286  outsrccnt_ = nullptr;
287  delete[] outsrcdspl_;
288  outsrcdspl_ = nullptr;
289  }
290 }
291 
292 } // namespace coreneuron
coreneuron::SidInfo::indices_
std::vector< int > indices_
Definition: partrans_setup.cpp:28
coreneuron::nrn_partrans::insrc_buf_
double * insrc_buf_
Definition: partrans.cpp:28
coreneuron::nrn_partrans::gap_data_indices_setup
void gap_data_indices_setup(NrnThread *nt)
For now, until conceptualization of the ordering is clear, just replace src setup_info_ indices value...
Definition: partrans_setup.cpp:239
coreneuron::nrnmpi_numprocs
int nrnmpi_numprocs
Definition: nrnmpi_def_cinc.cpp:10
coreneuron::nrn_partrans::outsrc_buf_
double * outsrc_buf_
Definition: partrans.cpp:29
coreneuron::nrn_partrans::gap_mpi_setup
void gap_mpi_setup(int ngroup)
Definition: partrans_setup.cpp:46
SetupTransferInfo
Definition: partrans.hpp:94
SetupTransferInfo::src_sid
std::vector< sgid_t > src_sid
Definition: partrans.hpp:95
have2want.h
coreneuron::NrnThread::id
int id
Definition: multicore.hpp:99
coreneuron::stdindex2ptr
double * stdindex2ptr(int mtype, int index, NrnThread &nt)
Definition: nrn_setup.cpp:636
coreneuron::have_to_want
static void have_to_want(HAVEWANT_t *have, int have_size, HAVEWANT_t *want, int want_size, HAVEWANT_t *&send_to_want, int *&send_to_want_cnt, int *&send_to_want_displ, HAVEWANT_t *&recv_from_have, int *&recv_from_have_cnt, int *&recv_from_have_displ, int(*rendezvous_rank)(HAVEWANT_t))
Definition: have2want.h:128
coreneuron::nrn_partrans::TransferThreadData::gather2outsrc_indices
std::vector< int > gather2outsrc_indices
Definition: partrans.hpp:81
coreneuron::nrn_partrans::insrcdspl_
int * insrcdspl_
Definition: partrans.hpp:116
coreneuron.hpp
coreneuron
THIS FILE IS AUTO GENERATED DONT MODIFY IT.
Definition: corenrn_parameters.cpp:12
coreneuron::i
int i
Definition: cellorder.cpp:485
coreneuron::nrn_partrans::outsrcdspl_
int * outsrcdspl_
Definition: partrans.hpp:116
nrniv_decl.h
nrnmpi.hpp
coreneuron::NrnThread
Definition: multicore.hpp:75
coreneuron::nrn_partrans::outsrccnt_
int * outsrccnt_
Definition: partrans.hpp:116
partrans.hpp
coreneuron::NrnThread::_data
double * _data
Definition: multicore.hpp:106
coreneuron::nrn_threads
NrnThread * nrn_threads
Definition: multicore.cpp:56
coreneuron::default_rendezvous
static int default_rendezvous(HAVEWANT_t key)
Definition: have2want.h:55
nrnconf.h
coreneuron::nrn_partrans::TransferThreadData::src_indices
std::vector< int > src_indices
Definition: partrans.hpp:79
coreneuron::nrn_partrans::TransferThreadData::tar_indices
std::vector< int > tar_indices
Definition: partrans.hpp:85
coreneuron::nrn_partrans::gap_cleanup
void gap_cleanup()
Definition: partrans_setup.cpp:271
multicore.hpp
coreneuron::nrn_partrans::TransferThreadData::insrc_indices
std::vector< int > insrc_indices
Definition: partrans.hpp:84
coreneuron::SidInfo::tids_
std::vector< int > tids_
Definition: partrans_setup.cpp:27
coreneuron::nrn_partrans::TransferThreadData
The basic problem is to copy sources to targets.
Definition: partrans.hpp:78
coreneuron::SidInfo
Definition: partrans_setup.cpp:25
coreneuron::nrnmpi_myid
int nrnmpi_myid
Definition: nrnmpi_def_cinc.cpp:11
coreneuron::nrn_partrans::insrccnt_
int * insrccnt_
Definition: partrans.cpp:30
coreneuron::nrn_partrans::setup_info_
SetupTransferInfo * setup_info_
Definition: partrans_setup.cpp:23
nrnmpi.h
coreneuron::nrn_partrans
Definition: partrans.hpp:30
sgid_t
int sgid_t
Definition: partrans.hpp:20
coreneuron::nrn_partrans::transfer_thread_data_
TransferThreadData * transfer_thread_data_
Definition: partrans.cpp:25