CoreNEURON
fadvance_core.cpp
Go to the documentation of this file.
1 /*
2 # =============================================================================
3 # Copyright (c) 2016 - 2022 Blue Brain Project/EPFL
4 #
5 # See top-level LICENSE file for details.
6 # =============================================================================.
7 */
8 
9 #include <functional>
10 
12 #include "coreneuron/nrnconf.h"
15 #include "coreneuron/mpi/nrnmpi.h"
26 
27 namespace coreneuron {
28 static void* nrn_fixed_step_thread(NrnThread*);
29 static void nrn_fixed_step_group_thread(NrnThread*, int, int, int&);
30 
31 
32 namespace {
33 
34 class ProgressBar final {
36  int current_step = 0;
37  bool show;
38  constexpr static int progressbar_update_steps = 5;
39 
40  public:
41  ProgressBar(int nsteps)
42  : show(nrnmpi_myid == 0 && !corenrn_param.is_quiet()) {
43  if (show) {
44  printf("\n");
45  pbar = progressbar_new("psolve", nsteps);
46  }
47  }
48 
49  void update(int step, double time) {
50  current_step = step;
51  if (show && (current_step % progressbar_update_steps) == 0) {
53  }
54  }
55 
56  void step(double time) {
57  update(current_step + 1, time);
58  }
59 
60  ~ProgressBar() {
61  if (show) {
63  }
64  }
65 };
66 
67 } // unnamed namespace
68 
69 
70 void dt2thread(double adt) { /* copied from nrnoc/fadvance.c */
71  if (adt != nrn_threads[0]._dt) {
72  for (int i = 0; i < nrn_nthread; ++i) {
73  NrnThread* nt = nrn_threads + i;
74  nt->_t = t;
75  nt->_dt = dt;
76  if (secondorder) {
77  nt->cj = 2.0 / dt;
78  } else {
79  nt->cj = 1.0 / dt;
80  }
81  nrn_pragma_acc(update device(nt->_t, nt->_dt, nt->cj)
82  async(nt->stream_id) if (nt->compute_gpu))
83  // clang-format off
84  nrn_pragma_omp(target update to(nt->_t, nt->_dt, nt->cj)
85  if(nt->compute_gpu))
86  // clang-format on
87  }
88  }
89 }
90 
91 void nrn_fixed_step_minimal() { /* not so minimal anymore with gap junctions */
92  Instrumentor::phase p_timestep("timestep");
93  if (t != nrn_threads->_t) {
94  dt2thread(-1.);
95  } else {
96  dt2thread(dt);
97  }
100  if (nrn_have_gaps) {
101  {
102  Instrumentor::phase p_gap("gap-v-transfer");
104  }
106  }
107 #if NRNMPI
108  if (nrn_threads[0]._stop_stepping) {
110  }
111 #endif
112 
113 #if defined(ENABLE_BIN_REPORTS) || defined(ENABLE_SONATA_REPORTS)
114  {
115  Instrumentor::phase p("flush_reports");
117  }
118 #endif
119  t = nrn_threads[0]._t;
120 }
121 
122 /* better cache efficiency since a thread can do an entire minimum delay
123 integration interval before joining
124 */
125 /// --> Coreneuron
126 
127 
128 void nrn_fixed_single_steps_minimal(int total_sim_steps, double tstop) {
129  ProgressBar progress_bar(total_sim_steps);
130 #if NRNMPI
131  double updated_tstop = tstop - dt;
132  nrn_assert(nrn_threads->_t <= tstop);
133  // It may very well be the case that we do not advance at all
134  while (nrn_threads->_t <= updated_tstop) {
135 #else
136  double updated_tstop = tstop - .5 * dt;
137  while (nrn_threads->_t < updated_tstop) {
138 #endif
140  if (stoprun) {
141  break;
142  }
143  progress_bar.step(nrn_threads[0]._t);
144  }
145 }
146 
147 
148 void nrn_fixed_step_group_minimal(int total_sim_steps) {
149  dt2thread(dt);
151  int step_group_n = total_sim_steps;
152  int step_group_begin = 0;
153  int step_group_end = 0;
154 
155  ProgressBar progress_bar(step_group_n);
156  while (step_group_end < step_group_n) {
158  step_group_n,
159  step_group_begin,
160  step_group_end);
161 #if NRNMPI
163 #endif
164 
165 #if defined(ENABLE_BIN_REPORTS) || defined(ENABLE_SONATA_REPORTS)
166  {
167  Instrumentor::phase p("flush_reports");
169  }
170 #endif
171  if (stoprun) {
172  break;
173  }
174  step_group_begin = step_group_end;
175  progress_bar.update(step_group_end, nrn_threads[0]._t);
176  }
177  t = nrn_threads[0]._t;
178 }
179 
181  int step_group_max,
182  int step_group_begin,
183  int& step_group_end) {
184  nth->_stop_stepping = 0;
185  for (int i = step_group_begin; i < step_group_max; ++i) {
186  Instrumentor::phase p_timestep("timestep");
188  if (nth->_stop_stepping) {
189  if (nth->id == 0) {
190  step_group_end = i + 1;
191  }
192  nth->_stop_stepping = 0;
193  return;
194  }
195  }
196  if (nth->id == 0) {
197  step_group_end = step_group_max;
198  }
199 }
200 
201 void update(NrnThread* _nt) {
202  double* vec_v = &(VEC_V(0));
203  double* vec_rhs = &(VEC_RHS(0));
204  int i2 = _nt->end;
205 
206  /* do not need to worry about linmod or extracellular*/
207  if (secondorder) {
208  nrn_pragma_acc(parallel loop present(vec_v [0:i2], vec_rhs [0:i2]) if (_nt->compute_gpu)
209  async(_nt->stream_id))
210  nrn_pragma_omp(target teams distribute parallel for simd if(_nt->compute_gpu))
211  for (int i = 0; i < i2; ++i) {
212  vec_v[i] += 2. * vec_rhs[i];
213  }
214  } else {
215  nrn_pragma_acc(parallel loop present(vec_v [0:i2], vec_rhs [0:i2]) if (_nt->compute_gpu)
216  async(_nt->stream_id))
217  nrn_pragma_omp(target teams distribute parallel for simd if(_nt->compute_gpu))
218  for (int i = 0; i < i2; ++i) {
219  vec_v[i] += vec_rhs[i];
220  }
221  }
222 
223  if (_nt->tml) {
224  assert(_nt->tml->index == CAP);
225  nrn_cur_capacitance(_nt, _nt->tml->ml, _nt->tml->index);
226  }
227  if (nrn_use_fast_imem) {
228  nrn_calc_fast_imem(_nt);
229  }
230 }
231 
232 void nonvint(NrnThread* _nt) {
233  if (nrn_have_gaps) {
234  Instrumentor::phase p("gap-v-transfer");
236  }
237  errno = 0;
238 
239  Instrumentor::phase_begin("state-update");
240  for (auto tml = _nt->tml; tml; tml = tml->next)
241  if (corenrn.get_memb_func(tml->index).state) {
242  mod_f_t s = corenrn.get_memb_func(tml->index).state;
243  std::string ss("state-");
244  ss += nrn_get_mechname(tml->index);
245  {
246  Instrumentor::phase p(ss.c_str());
247  (*s)(_nt, tml->ml, tml->index);
248  }
249 #ifdef DEBUG
250  if (errno) {
251  hoc_warning("errno set during calculation of states", nullptr);
252  }
253 #endif
254  }
255  Instrumentor::phase_end("state-update");
256 }
257 
258 void nrn_ba(NrnThread* nt, int bat) {
259  for (auto tbl = nt->tbl[bat]; tbl; tbl = tbl->next) {
260  mod_f_t f = tbl->bam->f;
261  int type = tbl->bam->type;
262  Memb_list* ml = tbl->ml;
263  (*f)(nt, ml, type);
264  }
265 }
266 
268  if (nrn2core_trajectory_values_ == nullptr) {
269  // standalone execution : no callbacks
270  return;
271  }
272  // if per time step transfer, need to call nrn_record_init() in NEURON.
273  // if storing full trajectories in CoreNEURON, need to initialize
274  // vsize for all the trajectory requests.
275  (*nrn2core_trajectory_values_)(-1, 0, nullptr, 0.0);
276  for (int tid = 0; tid < nrn_nthread; ++tid) {
277  NrnThread& nt = nrn_threads[tid];
278  if (nt.trajec_requests) {
279  nt.trajec_requests->vsize = 0;
280  }
281  }
282 }
283 
285  if (nrn2core_trajectory_values_ == nullptr) {
286  // standalone execution : no callbacks
287  return;
288  }
289 
291  if (tr) {
292  if (tr->varrays) { // full trajectories into Vector data
293  int vs = tr->vsize++;
294  // make sure we do not overflow the `varrays` buffers
295  assert(vs < tr->bsize);
296 
297  nrn_pragma_acc(parallel loop present(tr [0:1]) if (nth->compute_gpu)
298  async(nth->stream_id))
299  nrn_pragma_omp(target teams distribute parallel for simd if(nth->compute_gpu))
300  for (int i = 0; i < tr->n_trajec; ++i) {
301  tr->varrays[i][vs] = *tr->gather[i];
302  }
303  } else if (tr->scatter) { // scatter to NEURON and notify each step.
305  // Note that this is rather inefficient: we generate one `acc update
306  // self` call for each `double` value (voltage, membrane current,
307  // mechanism property, ...) that is being recorded, even though in most
308  // cases these values will actually fall in a small number of contiguous
309  // ranges in memory. A better solution, if the performance of this
310  // branch becomes limiting, might be to offload this loop to the
311  // device and populate some `scatter_values` array there and copy it
312  // back with a single transfer. Note that the `async` clause here
313  // should guarantee that correct values are reported even of
314  // mechanism data that is updated in `nrn_state`. See also:
315  // https://github.com/BlueBrain/CoreNeuron/issues/611
316  for (int i = 0; i < tr->n_trajec; ++i) {
317  double* gather_i = tr->gather[i];
318  static_cast<void>(gather_i);
319  nrn_pragma_acc(update self(gather_i [0:1]) if (nth->compute_gpu)
320  async(nth->stream_id))
321  nrn_pragma_omp(target update from(gather_i [0:1]) if (nth->compute_gpu))
322  }
323  nrn_pragma_acc(wait(nth->stream_id))
324  for (int i = 0; i < tr->n_trajec; ++i) {
325  *(tr->scatter[i]) = *(tr->gather[i]);
326  }
327  (*nrn2core_trajectory_values_)(nth->id, tr->n_pr, tr->vpr, nth->_t);
328  }
329  }
330 }
331 
332 static void* nrn_fixed_step_thread(NrnThread* nth) {
333  /* check thresholds and deliver all (including binqueue)
334  events up to t+dt/2 */
335  {
336  Instrumentor::phase p("deliver-events");
337  deliver_net_events(nth);
338  }
339 
340  nth->_t += .5 * nth->_dt;
341 
342  if (nth->ncell) {
343  /*@todo: do we need to update nth->_t on GPU: Yes (Michael, but can
344  launch kernel) */
345  nrn_pragma_acc(update device(nth->_t) if (nth->compute_gpu) async(nth->stream_id))
346  nrn_pragma_acc(wait(nth->stream_id))
347  nrn_pragma_omp(target update to(nth->_t) if (nth->compute_gpu))
349 
350  {
351  Instrumentor::phase p("setup-tree-matrix");
353  }
354 
355  {
356  Instrumentor::phase p("matrix-solver");
357  nrn_solve_minimal(nth);
358  }
359 
360  {
361  Instrumentor::phase p("second-order-cur");
363  }
364 
365  {
366  Instrumentor::phase p("update");
367  update(nth);
368  }
369  }
370  if (!nrn_have_gaps) {
372  }
373  return nullptr;
374 }
375 
377  nth->_t += .5 * nth->_dt;
378 
379  if (nth->ncell) {
380  /*@todo: do we need to update nth->_t on GPU */
381  nrn_pragma_acc(update device(nth->_t) if (nth->compute_gpu) async(nth->stream_id))
382  nrn_pragma_acc(wait(nth->stream_id))
383  nrn_pragma_omp(target update to(nth->_t) if (nth->compute_gpu))
385  nonvint(nth);
386  nrn_ba(nth, AFTER_SOLVE);
387  nrn_ba(nth, BEFORE_STEP);
388  nrncore2nrn_send_values(nth); // consistent with NEURON. (after BEFORE_STEP)
389  } else {
391  }
392 
393  {
394  Instrumentor::phase p("deliver-events");
395  nrn_deliver_events(nth); /* up to but not past texit */
396  }
397 
398  return nullptr;
399 }
400 } // namespace coreneuron
VEC_RHS
#define VEC_RHS(i)
Definition: nrnconf.h:30
coreneuron::nrn_calc_fast_imem
void nrn_calc_fast_imem(NrnThread *nt)
Definition: fast_imem.cpp:44
coreneuron::nrn_fixed_step_thread
static void * nrn_fixed_step_thread(NrnThread *)
Definition: fadvance_core.cpp:332
coreneuron::nrn_spike_exchange
void nrn_spike_exchange(NrnThread *nt)
coreneuron::nrn_nthread
int nrn_nthread
Definition: multicore.cpp:55
coreneuron::nrncore2nrn_send_init
void nrncore2nrn_send_init()
Definition: fadvance_core.cpp:267
coreneuron::nrn_fixed_single_steps_minimal
void nrn_fixed_single_steps_minimal(int total_sim_steps, double tstop)
--> Coreneuron
Definition: fadvance_core.cpp:128
nrn2core_direct.h
coreneuron::TrajectoryRequests::vsize
int vsize
Definition: multicore.hpp:65
progressbar_finish
void progressbar_finish(progressbar *bar)
Finish a progressbar, indicating 100% completion, and free it.
Definition: progressbar.cpp:245
coreneuron::dt2thread
void dt2thread(double adt)
Definition: fadvance_core.cpp:70
coreneuron::NrnThread::_t
double _t
Definition: multicore.hpp:76
coreneuron::nrn_use_fast_imem
bool nrn_use_fast_imem
Definition: fast_imem.cpp:19
nrnoc_aux.hpp
coreneuron::CoreNeuron::get_memb_func
auto & get_memb_func(size_t idx)
Definition: coreneuron.hpp:138
progressbar_update
void progressbar_update(progressbar *bar, unsigned long value, double t)
Increment an existing progressbar by value steps.
Definition: progressbar.cpp:110
coreneuron::nrn_ba
void nrn_ba(NrnThread *nt, int bat)
Definition: fadvance_core.cpp:258
coreneuron::TrajectoryRequests::n_trajec
int n_trajec
Definition: multicore.hpp:63
coreneuron::setup_tree_matrix_minimal
void * setup_tree_matrix_minimal(NrnThread *)
Definition: treeset_core.cpp:178
nrn_acc_manager.hpp
coreneuron::NrnThread::cj
double cj
Definition: multicore.hpp:78
coreneuron::NrnThread::id
int id
Definition: multicore.hpp:99
nrn_pragma_omp
nrn_pragma_acc(routine seq) nrn_pragma_omp(declare target) philox4x32_ctr_t coreneuron_random123_philox4x32_helper(coreneuron nrn_pragma_omp(end declare target) namespace coreneuron
Provide a helper function in global namespace that is declared target for OpenMP offloading to functi...
Definition: nrnran123.h:69
progressbar
Progressbar data structure (do not modify or create directly)
Definition: progressbar.hpp:21
coreneuron::nrn_solve_minimal
void nrn_solve_minimal(NrnThread *)
Definition: solve_core.cpp:18
netcvode.hpp
coreneuron::Memb_list
Definition: mechanism.hpp:131
coreneuron::Instrumentor::phase_begin
static void phase_begin(const char *name)
Definition: profiler_interface.h:308
coreneuron::NrnThread::tml
NrnThreadMembList * tml
Definition: multicore.hpp:80
coreneuron::NrnThreadMembList::index
int index
Definition: multicore.hpp:35
coreneuron::hoc_warning
void hoc_warning(const char *s1, const char *s2)
Definition: nrnoc_aux.cpp:44
coreneuron::NrnThread::compute_gpu
int compute_gpu
Definition: multicore.hpp:136
profiler_interface.h
VEC_V
#define VEC_V(i)
Definition: nrnconf.h:31
coreneuron.hpp
coreneuron
THIS FILE IS AUTO GENERATED DONT MODIFY IT.
Definition: corenrn_parameters.cpp:12
coreneuron::NrnThread::trajec_requests
TrajectoryRequests * trajec_requests
Definition: multicore.hpp:146
fast_imem.hpp
coreneuron::nrn_fixed_step_minimal
void nrn_fixed_step_minimal()
Definition: fadvance_core.cpp:91
coreneuron::t
double t
Definition: register_mech.cpp:22
corenrn_parameters.hpp
coreneuron::NrnThread::tbl
NrnThreadBAList * tbl[BEFORE_AFTER_SIZE]
Definition: multicore.hpp:133
coreneuron::i
int i
Definition: cellorder.cpp:485
coreneuron::NrnThread::_dt
double _dt
Definition: multicore.hpp:77
coreneuron::update
void update(NrnThread *_nt)
Definition: fadvance_core.cpp:201
coreneuron::dt
double dt
Definition: register_mech.cpp:22
coreneuron::nrn_multithread_job
void nrn_multithread_job(F &&job, Args &&... args)
Definition: multicore.hpp:161
nrn2core_trajectory_values_
void(* nrn2core_trajectory_values_)(int tid, int n_pr, void **vpr, double t)
Definition: nrn_setup.cpp:67
coreneuron::TrajectoryRequests::scatter
double ** scatter
Definition: multicore.hpp:59
progressbar_new
progressbar * progressbar_new(const char *label, unsigned long max)
Create a new progress bar with the specified label and max number of steps.
Definition: progressbar.cpp:88
coreneuron::NrnThread::_stop_stepping
int _stop_stepping
Definition: multicore.hpp:100
coreneuron::mod_f_t
void(*)(NrnThread *, Memb_list *, int) mod_f_t
Definition: membfunc.hpp:24
progressbar_update_steps
constexpr static int progressbar_update_steps
Definition: fadvance_core.cpp:38
coreneuron::NrnThread
Definition: multicore.hpp:75
coreneuron::TrajectoryRequests::varrays
double ** varrays
Definition: multicore.hpp:60
coreneuron::NrnThreadBAList::next
NrnThreadBAList * next
Definition: multicore.hpp:49
coreneuron::Instrumentor::phase
Definition: profiler_interface.h:289
coreneuron::nrn_flush_reports
void nrn_flush_reports(double t)
Definition: nrnreport.cpp:36
coreneuron::nrncore2nrn_send_values
void nrncore2nrn_send_values(NrnThread *nth)
Definition: fadvance_core.cpp:284
partrans.hpp
coreneuron::corenrn_param
corenrn_parameters corenrn_param
Printing method.
Definition: corenrn_parameters.cpp:268
coreneuron::NrnThread::stream_id
int stream_id
Definition: multicore.hpp:137
coreneuron::TrajectoryRequests::vpr
void ** vpr
Definition: multicore.hpp:58
coreneuron::nrn_threads
NrnThread * nrn_threads
Definition: multicore.cpp:56
coreneuron::corenrn
CoreNeuron corenrn
Definition: multicore.cpp:53
coreneuron::TrajectoryRequests
Definition: multicore.hpp:57
AFTER_SOLVE
#define AFTER_SOLVE
Definition: membfunc.hpp:70
coreneuron::deliver_net_events
void deliver_net_events(NrnThread *nt)
Definition: cvodestb.cpp:24
coreneuron::nrnmpi_v_transfer
void nrnmpi_v_transfer()
Definition: partrans.cpp:35
coreneuron::second_order_cur
void second_order_cur(NrnThread *_nt, int secondorder)
nrnconf.h
coreneuron::nrn_fixed_step_group_minimal
void nrn_fixed_step_group_minimal(int total_sim_steps)
Definition: fadvance_core.cpp:148
coreneuron::nrn_cur_capacitance
void nrn_cur_capacitance(NrnThread *_nt, Memb_list *ml, int type)
Definition: capac.cpp:101
coreneuron::nrn_fixed_step_group_thread
static void nrn_fixed_step_group_thread(NrnThread *, int, int, int &)
Definition: fadvance_core.cpp:180
nrnreport.hpp
coreneuron::NrnThreadMembList::next
NrnThreadMembList * next
Definition: multicore.hpp:33
coreneuron::TrajectoryRequests::n_pr
int n_pr
Definition: multicore.hpp:62
coreneuron::nrn_get_mechname
const char * nrn_get_mechname(int type)
Definition: mk_mech.cpp:145
show
bool show
Definition: fadvance_core.cpp:37
coreneuron::nrnthread_v_transfer
void nrnthread_v_transfer(NrnThread *_nt)
Definition: partrans.cpp:108
current_step
int current_step
Definition: fadvance_core.cpp:36
pbar
progressbar * pbar
Definition: fadvance_core.cpp:35
CAP
#define CAP
Definition: membfunc.hpp:60
multicore.hpp
coreneuron::secondorder
int secondorder
Definition: register_mech.cpp:21
progressbar.hpp
coreneuron::nonvint
void nonvint(NrnThread *_nt)
Definition: fadvance_core.cpp:232
coreneuron::nrn_fixed_step_lastpart
void * nrn_fixed_step_lastpart(NrnThread *nth)
Definition: fadvance_core.cpp:376
netpar.hpp
coreneuron::nrn_have_gaps
bool nrn_have_gaps
variables defined in coreneuron library
Definition: partrans.cpp:21
coreneuron::nrnmpi_myid
int nrnmpi_myid
Definition: nrnmpi_def_cinc.cpp:11
coreneuron::TrajectoryRequests::gather
double ** gather
Definition: multicore.hpp:61
coreneuron::NrnThread::end
int end
Definition: multicore.hpp:98
coreneuron::nrn_pragma_acc
nrn_pragma_acc(routine vector) static void triang_interleaved2(NrnThread *nt
Definition: ivocvect.cpp:30
coreneuron::if
if(ncell==0)
Definition: cellorder.cpp:637
coreneuron::nrn_thread_table_check
void nrn_thread_table_check()
Definition: multicore.cpp:168
nrn_assert
#define nrn_assert(x)
assert()-like macro, independent of NDEBUG status
Definition: nrn_assert.h:33
coreneuron::nrn_deliver_events
void nrn_deliver_events(NrnThread *nt)
Definition: cvodestb.cpp:32
coreneuron::NrnThreadMembList::ml
Memb_list * ml
Definition: multicore.hpp:34
coreneuron::Instrumentor::phase_end
static void phase_end(const char *name)
Definition: profiler_interface.h:312
nrnmpi.h
coreneuron::NrnThread::ncell
int ncell
Definition: multicore.hpp:97
BEFORE_STEP
#define BEFORE_STEP
Definition: membfunc.hpp:71
coreneuron::fixed_play_continuous
void fixed_play_continuous(NrnThread *nt)
Definition: cvodestb.cpp:81
coreneuron::stoprun
bool stoprun
Definition: nrnoc_aux.cpp:19