CoreNEURON
nrnran123.h
Go to the documentation of this file.
1 /*
2 # =============================================================================
3 # Copyright (c) 2016 - 2022 Blue Brain Project/EPFL
4 #
5 # See top-level LICENSE file for details.
6 # =============================================================================.
7 */
8 #pragma once
9 
10 /* interface to Random123 */
11 /* http://www.thesalmons.org/john/random123/papers/random123sc11.pdf */
12 
13 /*
14 The 4x32 generators utilize a uint32x4 counter and uint32x4 key to transform
15 into an almost cryptographic quality uint32x4 random result.
16 There are many possibilites for balancing the sharing of the internal
17 state instances while reserving a uint32 counter for the stream sequence
18 and reserving other portions of the counter vector for stream identifiers
19 and global index used by all streams.
20 
21 We currently provide a single instance by default in which the policy is
22 to use the 0th counter uint32 as the stream sequence, words 2 and 3 as the
23 stream identifier, and word 0 of the key as the global index. Unused words
24 are constant uint32 0.
25 
26 It is also possible to use Random123 directly without reference to this
27 interface. See Random123-1.02/docs/html/index.html
28 of the full distribution available from
29 http://www.deshawresearch.com/resources_random123.html
30 */
31 
32 #ifdef __bgclang__
33 #define R123_USE_MULHILO64_MULHI_INTRIN 0
34 #define R123_USE_GNU_UINT128 1
35 #endif
36 
38 
39 #include <Random123/philox.h>
40 #include <inttypes.h>
41 
42 #include <cmath>
43 
44 // Some files are compiled with DISABLE_OPENACC, and some builds have no GPU
45 // support at all. In these two cases, request that the random123 state is
46 // allocated using new/delete instead of CUDA unified memory.
47 #if defined(CORENEURON_ENABLE_GPU) && !defined(DISABLE_OPENACC)
48 #define CORENRN_RAN123_USE_UNIFIED_MEMORY true
49 #else
50 #define CORENRN_RAN123_USE_UNIFIED_MEMORY false
51 #endif
52 
53 namespace coreneuron {
54 
56  philox4x32_ctr_t c;
57  philox4x32_ctr_t r;
58  char which_;
59 };
60 
61 } // namespace coreneuron
62 
63 /** @brief Provide a helper function in global namespace that is declared target for OpenMP
64  * offloading to function correctly with NVHPC
65  */
66 nrn_pragma_acc(routine seq)
67 nrn_pragma_omp(declare target)
69 nrn_pragma_omp(end declare target)
70 
71 namespace coreneuron {
74 
75 /* global index. eg. run number */
76 /* all generator instances share this global index */
77 void nrnran123_set_globalindex(uint32_t gix);
78 uint32_t nrnran123_get_globalindex();
79 
80 // Utilities used for calculating model size, only called from the CPU.
81 std::size_t nrnran123_instance_count();
82 inline std::size_t nrnran123_state_size() {
83  return sizeof(nrnran123_State);
84 }
85 
86 /* routines for creating and deleting streams are called from cpu */
87 nrnran123_State* nrnran123_newstream3(uint32_t id1,
88  uint32_t id2,
89  uint32_t id3,
90  bool use_unified_memory = CORENRN_RAN123_USE_UNIFIED_MEMORY);
91 inline nrnran123_State* nrnran123_newstream(
92  uint32_t id1,
93  uint32_t id2,
94  bool use_unified_memory = CORENRN_RAN123_USE_UNIFIED_MEMORY) {
95  return nrnran123_newstream3(id1, id2, 0, use_unified_memory);
96 }
97 void nrnran123_deletestream(nrnran123_State* s,
98  bool use_unified_memory = CORENRN_RAN123_USE_UNIFIED_MEMORY);
99 
100 /* minimal data stream */
101 constexpr void nrnran123_getseq(nrnran123_State* s, uint32_t* seq, char* which) {
102  *seq = s->c.v[0];
103  *which = s->which_;
104 }
105 constexpr void nrnran123_getids(nrnran123_State* s, uint32_t* id1, uint32_t* id2) {
106  *id1 = s->c.v[2];
107  *id2 = s->c.v[3];
108 }
109 constexpr void nrnran123_getids3(nrnran123_State* s, uint32_t* id1, uint32_t* id2, uint32_t* id3) {
110  *id3 = s->c.v[1];
111  *id1 = s->c.v[2];
112  *id2 = s->c.v[3];
113 }
114 
115 // Uniform 0 to 2*32-1
116 inline uint32_t nrnran123_ipick(nrnran123_State* s) {
117  char which = s->which_;
118  uint32_t rval{s->r.v[int{which++}]};
119  if (which > 3) {
120  which = 0;
121  s->c.v[0]++;
123  }
124  s->which_ = which;
125  return rval;
126 }
127 
128 constexpr double nrnran123_uint2dbl(uint32_t u) {
129  constexpr double SHIFT32 = 1.0 / 4294967297.0; /* 1/(2^32 + 1) */
130  /* 0 to 2^32-1 transforms to double value in open (0,1) interval */
131  /* min 2.3283064e-10 to max (1 - 2.3283064e-10) */
132  return (static_cast<double>(u) + 1.0) * SHIFT32;
133 }
134 
135 // Uniform open interval (0,1), minimum value is 2.3283064e-10 and max value is 1-min
136 inline double nrnran123_dblpick(nrnran123_State* s) {
137  return nrnran123_uint2dbl(nrnran123_ipick(s));
138 }
139 
140 /* this could be called from openacc parallel construct (in INITIAL block) */
141 inline void nrnran123_setseq(nrnran123_State* s, uint32_t seq, char which) {
142  if (which > 3) {
143  s->which_ = 0;
144  } else {
145  s->which_ = which;
146  }
147  s->c.v[0] = seq;
149 }
150 
151 // nrnran123_negexp min value is 2.3283064e-10, max is 22.18071, mean 1.0
152 inline double nrnran123_negexp(nrnran123_State* s) {
153  return -std::log(nrnran123_dblpick(s));
154 }
155 
156 /* at cost of a cached value we could compute two at a time. */
157 inline double nrnran123_normal(nrnran123_State* s) {
158  double w, u1;
159  do {
160  u1 = nrnran123_dblpick(s);
161  double u2{nrnran123_dblpick(s)};
162  u1 = 2. * u1 - 1.;
163  u2 = 2. * u2 - 1.;
164  w = (u1 * u1) + (u2 * u2);
165  } while (w > 1);
166  double y{std::sqrt((-2. * std::log(w)) / w)};
167  return u1 * y;
168 }
169 
170 // nrnran123_gauss, nrnran123_iran were declared but not defined in CoreNEURON
171 // nrnran123_array4x32 was declared but not used in CoreNEURON
172 } // namespace coreneuron
coreneuron::nrnran123_get_globalindex
uint32_t nrnran123_get_globalindex()
Definition: nrnran123.cpp:108
coreneuron_random123_philox4x32_helper
CORENRN_HOST_DEVICE philox4x32_ctr_t coreneuron_random123_philox4x32_helper(coreneuron::nrnran123_State *s)
Definition: nrnran123.cpp:98
coreneuron::nrnran123_instance_count
std::size_t nrnran123_instance_count()
Definition: nrnran123.cpp:103
coreneuron::nrnran123_destroy_global_state_on_device
void nrnran123_destroy_global_state_on_device()
Definition: nrnran123.cpp:154
nrn_pragma_omp
nrn_pragma_acc(routine seq) nrn_pragma_omp(declare target) philox4x32_ctr_t coreneuron_random123_philox4x32_helper(coreneuron nrn_pragma_omp(end declare target) namespace coreneuron
Provide a helper function in global namespace that is declared target for OpenMP offloading to functi...
Definition: nrnran123.h:69
coreneuron::nrnran123_set_globalindex
void nrnran123_set_globalindex(uint32_t gix)
Definition: nrnran123.cpp:113
coreneuron
THIS FILE IS AUTO GENERATED DONT MODIFY IT.
Definition: corenrn_parameters.cpp:12
nrn_pragma_acc
#define nrn_pragma_acc(x)
Definition: offload.hpp:20
coreneuron::nrnran123_State::r
philox4x32_ctr_t r
Definition: nrnran123.h:57
coreneuron::nrnran123_deletestream
void nrnran123_deletestream(nrnran123_State *s, bool use_unified_memory)
Definition: nrnran123.cpp:201
coreneuron::nrnran123_newstream3
nrnran123_State * nrnran123_newstream3(uint32_t id1, uint32_t id2, uint32_t id3, bool use_unified_memory)
Allocate a new Random123 stream.
Definition: nrnran123.cpp:168
coreneuron::nrnran123_State::c
philox4x32_ctr_t c
Definition: nrnran123.h:56
coreneuron::nrnran123_initialise_global_state_on_device
void nrnran123_initialise_global_state_on_device()
Definition: nrnran123.cpp:146
coreneuron::nrnran123_State
Definition: nrnran123.h:55
offload.hpp
CORENRN_RAN123_USE_UNIFIED_MEMORY
#define CORENRN_RAN123_USE_UNIFIED_MEMORY
Definition: nrnran123.h:50
coreneuron::nrnran123_State::which_
char which_
Definition: nrnran123.h:58