CoreNEURON
partrans.hpp
Go to the documentation of this file.
1 /*
2 # =============================================================================
3 # Copyright (c) 2016 - 2021 Blue Brain Project/EPFL
4 #
5 # See top-level LICENSE file for details.
6 # =============================================================================
7 */
8 
9 #pragma once
10 
12 
13 #ifndef NRNLONGSGID
14 #define NRNLONGSGID 0
15 #endif
16 
17 #if NRNLONGSGID
18 using sgid_t = int64_t;
19 #else
20 using sgid_t = int;
21 #endif
22 
23 namespace coreneuron {
24 struct Memb_list;
25 
26 extern bool nrn_have_gaps;
27 extern void nrnmpi_v_transfer();
28 extern void nrnthread_v_transfer(NrnThread*);
29 
30 namespace nrn_partrans {
31 
32 /** The basic problem is to copy sources to targets.
33  * It may be the case that a source gets copied to several targets.
34  * Sources and targets are a set of indices in NrnThread.data.
35  * A copy may be intrathread, interthread, interprocess.
36  * Copies happen every time step so efficiency is desirable.
37  * SetupTransferInfo gives us the source and target (sid, type, index) triples
38  * for a thread and all the global threads define what gets copied where.
39  * Need to process that info into TransferThreadData for each thread and
40  * the interprocessor mpi buffers insrc_buf_ and outsrc_buf transfered with
41  * MPI_Alltoallv, hopefully with a more or less optimal ordering.
42  * The compute strategy is: 1) Each thread copies its NrnThread.data source
43  * items to outsrc_buf_. 2) MPI_Allgatherv transfers outsrc_buf_ to insrc_buf_.
44  * 3) Each thread, copies insrc_buf_ values to Nrnthread.data target.
45  *
46  * Optimal ordering is probably beyond our reach but a few considerations
47  * may be useful. The typical use is for gap junctions where only voltage
48  * transferred and all instances of the HalfGap Point_process receive a
49  * voltage. Two situations are common. Voltage transfer is sparse and one
50  * to one, i.e many compartments do not have gap junctions, and those that do
51  * have only one. The other situation is that all compartments have gap
52  * junctions (e.g. syncytium of single compartment cells in the heart) and
53  * the voltage needs to be transferred to all neighboring cells (e.g. 6-18
54  * cells can be neighbors to the central cell). So on the target side, it
55  * might be good to copy to the target in target index order from the
56  * input_buf_. And on the source side, it is certainly simple to scatter
57  * to the outbut_buf_ in NrnThread.data order. Note that one expects a wide
58  * scatter to the outsrc_buf and also a wide scatter within the insrc_buf_.
59  **/
60 
61 /*
62  * In partrans.cpp: nrnmpi_v_transfer
63  * Copy NrnThead.data to outsrc_buf_ for all threads via
64  * gpu: gather src_gather[i] = NrnThread._data[src_indices[i]];
65  * gpu to host src_gather
66  * cpu: outsrc_buf_[outsrc_indices[i]] = src_gather[gather2outsrc_indices[i]];
67  *
68  * MPI_Allgatherv outsrc_buf_ to insrc_buf_
69  *
70  * host to gpu insrc_buf_
71  *
72  * In partrans.cpp: nrnthread_v_transfer
73  * insrc_buf_ to NrnThread._data via
74  * NrnThread.data[tar_indices[i]] = insrc_buf_[insrc_indices[i]];
75  * where tar_indices depends on layout, type, etc.
76  */
77 
79  std::vector<int> src_indices; // indices into NrnThread._data
80  std::vector<double> src_gather; // copy of NrnThread._data[src_indices]
81  std::vector<int> gather2outsrc_indices; // ix of src_gather that send into outsrc_indices
82  std::vector<int> outsrc_indices; // ix of outsrc_buf that receive src_gather values
83 
84  std::vector<int> insrc_indices; // insrc_buf_ indices copied to ...
85  std::vector<int> tar_indices; // indices of NrnThread.data.
86 };
87 extern TransferThreadData* transfer_thread_data_; /* array for threads */
88 
89 } // namespace nrn_partrans
90 } // namespace coreneuron
91 
92 // For direct transfer,
93 // must be same as corresponding struct SetupTransferInfo in NEURON
95  std::vector<sgid_t> src_sid;
96  std::vector<int> src_type;
97  std::vector<int> src_index;
98  std::vector<sgid_t> tar_sid;
99  std::vector<int> tar_type;
100  std::vector<int> tar_index;
101 };
102 
103 namespace coreneuron {
104 namespace nrn_partrans {
105 
106 extern SetupTransferInfo* setup_info_; /* array for threads exists only during setup*/
107 
108 extern void gap_mpi_setup(int ngroup);
109 extern void gap_data_indices_setup(NrnThread* nt);
110 extern void copy_gap_indices_to_device();
111 extern void delete_gap_indices_from_device();
112 extern void gap_cleanup();
113 
114 extern double* insrc_buf_; // Receive buffer for gap voltages
115 extern double* outsrc_buf_; // Send buffer for gap voltages
117 } // namespace nrn_partrans
118 } // namespace coreneuron
SetupTransferInfo::src_index
std::vector< int > src_index
Definition: partrans.hpp:97
coreneuron::nrn_partrans::insrc_buf_
double * insrc_buf_
Definition: partrans.cpp:28
coreneuron::nrn_partrans::gap_data_indices_setup
void gap_data_indices_setup(NrnThread *nt)
For now, until conceptualization of the ordering is clear, just replace src setup_info_ indices value...
Definition: partrans_setup.cpp:239
coreneuron::nrn_partrans::TransferThreadData::src_gather
std::vector< double > src_gather
Definition: partrans.hpp:80
SetupTransferInfo::tar_sid
std::vector< sgid_t > tar_sid
Definition: partrans.hpp:98
SetupTransferInfo::tar_type
std::vector< int > tar_type
Definition: partrans.hpp:99
coreneuron::nrn_partrans::copy_gap_indices_to_device
void copy_gap_indices_to_device()
Definition: partrans.cpp:133
coreneuron::nrn_partrans::outsrc_buf_
double * outsrc_buf_
Definition: partrans.cpp:29
coreneuron::nrn_partrans::gap_mpi_setup
void gap_mpi_setup(int ngroup)
Definition: partrans_setup.cpp:46
SetupTransferInfo
Definition: partrans.hpp:94
SetupTransferInfo::src_sid
std::vector< sgid_t > src_sid
Definition: partrans.hpp:95
coreneuron::nrn_partrans::TransferThreadData::gather2outsrc_indices
std::vector< int > gather2outsrc_indices
Definition: partrans.hpp:81
coreneuron::nrn_partrans::insrcdspl_
int * insrcdspl_
Definition: partrans.hpp:116
SetupTransferInfo::tar_index
std::vector< int > tar_index
Definition: partrans.hpp:100
coreneuron
THIS FILE IS AUTO GENERATED DONT MODIFY IT.
Definition: corenrn_parameters.cpp:12
coreneuron::nrn_partrans::TransferThreadData::outsrc_indices
std::vector< int > outsrc_indices
Definition: partrans.hpp:82
coreneuron::nrn_partrans::outsrcdspl_
int * outsrcdspl_
Definition: partrans.hpp:116
coreneuron::nrn_partrans::outsrccnt_
int * outsrccnt_
Definition: partrans.hpp:116
coreneuron::nrnmpi_v_transfer
void nrnmpi_v_transfer()
Definition: partrans.cpp:35
coreneuron::nrn_partrans::TransferThreadData::src_indices
std::vector< int > src_indices
Definition: partrans.hpp:79
coreneuron::nrnthread_v_transfer
void nrnthread_v_transfer(NrnThread *_nt)
Definition: partrans.cpp:108
coreneuron::nrn_partrans::TransferThreadData::tar_indices
std::vector< int > tar_indices
Definition: partrans.hpp:85
coreneuron::nrn_partrans::gap_cleanup
void gap_cleanup()
Definition: partrans_setup.cpp:271
SetupTransferInfo::src_type
std::vector< int > src_type
Definition: partrans.hpp:96
multicore.hpp
coreneuron::nrn_partrans::TransferThreadData::insrc_indices
std::vector< int > insrc_indices
Definition: partrans.hpp:84
coreneuron::nrn_partrans::TransferThreadData
The basic problem is to copy sources to targets.
Definition: partrans.hpp:78
coreneuron::nrn_have_gaps
bool nrn_have_gaps
variables defined in coreneuron library
Definition: partrans.cpp:21
coreneuron::nrn_partrans::insrccnt_
int * insrccnt_
Definition: partrans.cpp:30
coreneuron::nrn_partrans::setup_info_
SetupTransferInfo * setup_info_
Definition: partrans_setup.cpp:23
sgid_t
int sgid_t
Definition: partrans.hpp:20
coreneuron::nrn_partrans::transfer_thread_data_
TransferThreadData * transfer_thread_data_
Definition: partrans.cpp:25
coreneuron::nrn_partrans::delete_gap_indices_from_device
void delete_gap_indices_from_device()
Definition: partrans.cpp:161