175 grp =
new int[ngrp + 1];
176 (*nrn2core_group_ids_)(grp);
180 FILE* fp = fopen(filesdat,
"r");
183 nrn_fatal_error(
"No input file ( %s ) with nrnthreads, exiting...", filesdat);
191 nrn_assert(fscanf(fp,
"%d\n", &iNumFiles) == 1);
195 if (iNumFiles == -1) {
196 nrn_assert(fscanf(fp,
"%d\n", &iNumFiles) == 1);
199 printf(
"Model uses gap junctions\n");
205 "Info : The number of input datasets are less than ranks, some ranks will be idle!\n");
212 for (
int iNum = 0; iNum < iNumFiles; ++iNum) {
231 auto gid2out_it =
gid2out.find(gid);
232 if (gid2out_it !=
gid2out.end()) {
233 *ps = gid2out_it->second;
235 auto gid2in_it =
gid2in.find(gid);
236 if (gid2in_it !=
gid2in.end()) {
237 *psi = gid2in_it->second;
243 *ps = gid2out_it->second;
258 std::vector<InputPreSyn*> inputpresyn_;
271 auto gid2out_it =
gid2out.find(gid);
272 if (gid2out_it !=
gid2out.end()) {
274 ++gid2out_it->second->nc_cnt_;
277 auto gid2in_it =
gid2in.find(gid);
278 if (gid2in_it !=
gid2in.end()) {
280 ++gid2in_it->second->nc_cnt_;
288 inputpresyn_.push_back(psi);
292 if (!negsrcgid_tid.empty()) {
293 tid = negsrcgid_tid[i_tid++];
298 ++gid2out_it->second->nc_cnt_;
339 for (
auto psi: inputpresyn_) {
340 psi->nc_index_ = offset;
341 offset += psi->nc_cnt_;
345 inputpresyn_.clear();
368 if (!negsrcgid_tid.empty() && gid < -1) {
369 tid = negsrcgid_tid[i_tid++];
402 bool is_mapping_needed,
404 bool run_setup_cleanup,
406 const char* restore_path,
416 strlen(restore_path) == 0 ? datpath : restore_path,
431 pnttype2presyn.clear();
432 pnttype2presyn.resize(memb_func.size(), -1);
433 for (
size_t i = 0;
i < nrn_has_net_event_.size(); ++
i) {
434 pnttype2presyn[nrn_has_net_event_[
i]] =
i;
477 coreneuron::phase_wrapper<coreneuron::phase::one>(userParams);
482 p1.populate(nt,
mut);
494 coreneuron::phase_wrapper<coreneuron::phase::two>(userParams,
corenrn_embedded);
503 coreneuron::phase_wrapper<coreneuron::gap>(userParams);
518 if (is_mapping_needed)
519 coreneuron::phase_wrapper<coreneuron::phase::three>(userParams);
523 if (run_setup_cleanup)
544 size_t model_size_bytes;
554 printf(
" Setup Done : %.2lf seconds \n",
nrn_wtime() - time);
556 if (model_size_bytes < 1024) {
557 printf(
" Model size : %ld bytes\n", model_size_bytes);
558 }
else if (model_size_bytes < 1024 * 1024) {
559 printf(
" Model size : %.2lf kB\n", model_size_bytes / 1024.);
560 }
else if (model_size_bytes < 1024 * 1024 * 1024) {
561 printf(
" Model size : %.2lf MB\n", model_size_bytes / (1024. * 1024.));
563 printf(
" Model size : %.2lf GB\n", model_size_bytes / (1024. * 1024. * 1024.));
578 const std::lock_guard<OMP_Mutex> lock(
mut);
596 int sidt_size = F.read_int();
597 assert(sidt_size ==
int(
sizeof(
sgid_t)));
598 std::size_t ntar = F.read_int();
599 std::size_t nsrc = F.read_int();
603 si.src_type.resize(nsrc);
604 si.src_index.resize(nsrc);
606 F.read_array<
sgid_t>(si.src_sid.data(), nsrc);
607 F.read_array<
int>(si.src_type.data(), nsrc);
608 F.read_array<
int>(si.src_index.data(), nsrc);
611 si.tar_sid.resize(ntar);
612 si.tar_type.resize(ntar);
613 si.tar_index.resize(ntar);
615 F.read_array<
sgid_t>(si.tar_sid.data(), ntar);
616 F.read_array<
int>(si.tar_type.data(), ntar);
617 F.read_array<
int>(si.tar_index.data(), ntar);
621 printf(
"%d read_phasegap tid=%d nsrc=%d ntar=%d\n",
nrnmpi_myid, nt.
id, nsrc, ntar);
622 for (
int i = 0;
i < nsrc; ++
i) {
623 printf(
"src %z %d %d\n",
size_t(si.src_sid[
i]), si.src_type[
i], si.src_index[
i]);
625 for (
int i = 0;
i < ntar; ++
i) {
626 printf(
"tar %z %d %d\n",
size_t(si.src_sid[
i]), si.src_type[
i], si.src_index[
i]);
658 return ml->
data + ix;
659 }
else if (mtype == 0) {
662 printf(
"stdindex2ptr does not handle mtype=%d\n", mtype);
675 icnt =
i % padded_cnt;
676 isz =
i / padded_cnt;
739 (*s)(nt, ml, tml->index);
759 (*priv_dtor)(nt, ml, tml->index);
760 assert(!ml->instance);
761 assert(!ml->global_variables);
762 assert(ml->global_variables_size == 0);
785 if (tml->dependencies)
786 free(tml->dependencies);
788 next_tml = tml->
next;
921 p1.populate(nt,
mut);
938 F.restore_checkpoint();
945 F.read_mapping_cell_count(&count);
951 for (
int i = 0;
i < nt.
ncell;
i++) {
952 int gid, nsec, nseg, nseclist;
955 F.read_mapping_count(&gid, &nsec, &nseg, &nseclist);
960 for (
int j = 0; j < nseclist; j++) {
962 F.read_mapping_info(smap);
973 nt.
mapping = (
void*) ntmapping;
1011 printf(
"%s %d psize=%d ppsize=%d cnt=%d nbyte=%ld\n",
1030 printf(
" gid2out table bytes=~%ld size=%ld\n", nbyte,
gid2out.size());
1039 size_t nbyte =
sizeof(
gid2in) +
sizeof(
int) *
gid2in.size() +
1042 printf(
" gid2in table bytes=~%ld size=%ld\n", nbyte,
gid2in.size());
1049 size_t sz_nrnThread =
sizeof(
NrnThread);
1050 size_t sz_presyn =
sizeof(
PreSyn);
1052 size_t sz_netcon =
sizeof(
NetCon);
1056 std::vector<long> size_data(13, 0);
1057 std::vector<long> global_size_data_min(13, 0);
1058 std::vector<long> global_size_data_max(13, 0);
1059 std::vector<long> global_size_data_sum(13, 0);
1060 std::vector<float> global_size_data_avg(13, 0.0);
1069 for (
auto tml = nt.
tml; tml; tml = tml->
next) {
1075 nb_nt += sz_nrnThread;
1077 nb_nt += nt.
end *
sizeof(int);
1085 printf(
"ncell=%d end=%d nmech=%d\n", nt.
ncell, nt.
end, nmech);
1087 printf(
"nbyte so far %ld\n", nb_nt);
1088 printf(
"n_presyn = %d sz=%ld nbyte=%ld\n", nt.
n_presyn, sz_presyn, nt.
n_presyn * sz_presyn);
1089 printf(
"n_input_presyn = %d sz=%ld nbyte=%ld\n",
1093 printf(
"n_pntproc=%d sz=%ld nbyte=%ld\n",
1097 printf(
"n_netcon=%d sz=%ld nbyte=%ld\n", nt.
n_netcon, sz_netcon, nt.
n_netcon * sz_netcon);
1098 printf(
"n_weight = %d\n", nt.
n_weight);
1100 printf(
"%d thread %d total bytes %ld\n",
nrnmpi_myid,
i, nb_nt);
1103 if (detailed_report) {
1104 size_data[0] += nt.
ncell;
1105 size_data[1] += nt.
end;
1106 size_data[2] += nmech;
1107 size_data[3] += nt.
_ndata;
1115 size_data[11] += nb_nt;
1119 nbyte += nccnt *
sizeof(
NetCon*);
1126 printf(
"%d netcon pointers %ld nbyte=%ld\n",
nrnmpi_myid, nccnt, nccnt *
sizeof(
NetCon*));
1127 printf(
"nrnran123 size=%ld cnt=%ld nbyte=%ld\n",
1128 nrnran123_state_size(),
1131 printf(
"%d total bytes %ld\n",
nrnmpi_myid, nbyte);
1133 if (detailed_report) {
1134 size_data[12] = nbyte;
1141 for (
int i = 0;
i < 13;
i++) {
1147 global_size_data_max = size_data;
1148 global_size_data_min = size_data;
1149 global_size_data_avg.assign(size_data.cbegin(), size_data.cend());
1153 printf(
"Memory size information for all NrnThreads per rank\n");
1154 printf(
"------------------------------------------------------------------\n");
1155 printf(
"%22s %12s %12s %12s\n",
"field",
"min",
"max",
"avg");
1156 printf(
"%22s %12ld %12ld %15.2f\n",
1158 global_size_data_min[0],
1159 global_size_data_max[0],
1160 global_size_data_avg[0]);
1161 printf(
"%22s %12ld %12ld %15.2f\n",
1163 global_size_data_min[1],
1164 global_size_data_max[1],
1165 global_size_data_avg[1]);
1166 printf(
"%22s %12ld %12ld %15.2f\n",
1168 global_size_data_min[2],
1169 global_size_data_max[2],
1170 global_size_data_avg[2]);
1171 printf(
"%22s %12ld %12ld %15.2f\n",
1173 global_size_data_min[3],
1174 global_size_data_max[3],
1175 global_size_data_avg[3]);
1176 printf(
"%22s %12ld %12ld %15.2f\n",
1178 global_size_data_min[4],
1179 global_size_data_max[4],
1180 global_size_data_avg[4]);
1181 printf(
"%22s %12ld %12ld %15.2f\n",
1183 global_size_data_min[5],
1184 global_size_data_max[5],
1185 global_size_data_avg[5]);
1186 printf(
"%22s %12ld %12ld %15.2f\n",
1188 global_size_data_min[6],
1189 global_size_data_max[6],
1190 global_size_data_avg[6]);
1191 printf(
"%22s %12ld %12ld %15.2f\n",
1193 global_size_data_min[6] * sz_presyn,
1194 global_size_data_max[6] * sz_presyn,
1195 global_size_data_avg[6] * sz_presyn);
1196 printf(
"%22s %12ld %12ld %15.2f\n",
1198 global_size_data_min[7],
1199 global_size_data_max[7],
1200 global_size_data_avg[7]);
1201 printf(
"%22s %12ld %12ld %15.2f\n",
1202 "n_input_presyn (bytes)",
1203 global_size_data_min[7] * sz_input_presyn,
1204 global_size_data_max[7] * sz_input_presyn,
1205 global_size_data_avg[7] * sz_input_presyn);
1206 printf(
"%22s %12ld %12ld %15.2f\n",
1208 global_size_data_min[8],
1209 global_size_data_max[8],
1210 global_size_data_avg[8]);
1211 printf(
"%22s %12ld %12ld %15.2f\n",
1212 "n_pntproc (bytes)",
1213 global_size_data_min[8] * sz_pntproc,
1214 global_size_data_max[8] * sz_pntproc,
1215 global_size_data_avg[8] * sz_pntproc);
1216 printf(
"%22s %12ld %12ld %15.2f\n",
1218 global_size_data_min[9],
1219 global_size_data_max[9],
1220 global_size_data_avg[9]);
1221 printf(
"%22s %12ld %12ld %15.2f\n",
1223 global_size_data_min[9] * sz_netcon,
1224 global_size_data_max[9] * sz_netcon,
1225 global_size_data_avg[9] * sz_netcon);
1226 printf(
"%22s %12ld %12ld %15.2f\n",
1228 global_size_data_min[10],
1229 global_size_data_max[10],
1230 global_size_data_avg[10]);
1231 printf(
"%22s %12ld %12ld %15.2f\n",
1232 "NrnThread (bytes)",
1233 global_size_data_min[11],
1234 global_size_data_max[11],
1235 global_size_data_avg[11]);
1236 printf(
"%22s %12ld %12ld %15.2f\n",
1237 "model size (bytes)",
1238 global_size_data_min[12],
1239 global_size_data_max[12],
1240 global_size_data_avg[12]);
1246 long global_nbyte = 0;
1248 nbyte = global_nbyte;