NEURON
nrn_setup.cpp
1 /*
2 # =============================================================================
3 # Copyright (c) 2016 - 2021 Blue Brain Project/EPFL
4 #
5 # See top-level LICENSE file for details.
6 # =============================================================================.
7 */
8 
9 #include <algorithm>
10 #include <vector>
11 #include <map>
12 #include <cstring>
13 #include <mutex>
14 
16 #include "coreneuron/nrnconf.h"
26 #include "coreneuron/mpi/nrnmpi.h"
35 #include "coreneuron/io/phase1.hpp"
36 #include "coreneuron/io/phase2.hpp"
37 #include "coreneuron/io/phase3.hpp"
40 
41 // callbacks into nrn/src/nrniv/nrnbbcore_write.cpp
44 
45 
46 /// --> Coreneuron
47 bool corenrn_embedded;
48 bool corenrn_file_mode;
49 int corenrn_embedded_nthread;
50 
51 void (*nrn2core_group_ids_)(int*);
52 
53 extern "C" {
54 SetupTransferInfo* (*nrn2core_get_partrans_setup_info_)(int ngroup,
55  int cn_nthread,
56  size_t cn_sidt_size);
57 }
58 
59 void (*nrn2core_get_trajectory_requests_)(int tid,
60  int& bsize,
61  int& n_pr,
62  void**& vpr,
63  int& n_trajec,
64  int*& types,
65  int*& indices,
66  double**& pvars,
67  double**& varrays);
68 
69 void (*nrn2core_trajectory_values_)(int tid, int n_pr, void** vpr, double t);
70 
71 void (*nrn2core_trajectory_return_)(int tid, int n_pr, int bsize, int vecsz, void** vpr, double t);
72 
73 int (*nrn2core_all_spike_vectors_return_)(std::vector<double>& spikevec, std::vector<int>& gidvec);
74 
75 void (*nrn2core_all_weights_return_)(std::vector<double*>& weights);
76 
77 // file format defined in cooperation with nrncore/src/nrniv/nrnbbcore_write.cpp
78 // single integers are ascii one per line. arrays are binary int or double
79 // Note that regardless of the gid contents of a group, since all gids are
80 // globally unique, a filename convention which involves the first gid
81 // from the group is adequate. Also note that balance is carried out from a
82 // per group perspective and launching a process consists of specifying
83 // a list of group ids (first gid of the group) for each process.
84 //
85 // <firstgid>_1.dat
86 // n_presyn, n_netcon
87 // output_gids (npresyn) with -(type+1000*index) for those acell with no gid
88 // netcon_srcgid (nnetcon) -(type+1000*index) refers to acell with no gid
89 // -1 means the netcon has no source (not implemented)
90 // Note that the negative gids are only thread unique and not process unique.
91 // We create a thread specific hash table for the negative gids for each thread
92 // when <firstgid>_1.dat is read and then destroy it after <firstgid>_2.dat
93 // is finished using it. An earlier implementation which attempted to
94 // encode the thread number into the negative gid
95 // (i.e -ith - nth*(type +1000*index)) failed due to not large enough
96 // integer domain size.
97 // Note that for file transfer it is an error if a negative srcgid is
98 // not in the same thread as the target. This is because it may
99 // not be the case that threads in a NEURON process end up on the same process
100 // in CoreNEURON. NEURON will raise an error if this
101 // is the case. However, for direct memory transfer, it is allowed that
102 // a negative srcgid may be in a different thread than the target. So
103 // nrn2core_get_dat1 has a last arg netcon_negsrcgid_tid that specifies
104 // for the negative gids in netcon_srcgid (in that order) the source thread.
105 //
106 // <firstgid>_2.dat
107 // n_real_cell, n_output, n_real_output, nnode
108 // ndiam - 0 if no mechanism has dparam with diam semantics, or nnode
109 // nmech - includes artcell mechanisms
110 // for the nmech tml mechanisms
111 // type, nodecount
112 // nidata, nvdata, nweight
113 // v_parent_index (nnode)
114 // actual_a, b, area, v (nnode)
115 // diam - if ndiam > 0. Note that only valid diam is for those nodes with diam semantics mechanisms
116 // for the nmech tml mechanisms
117 // nodeindices (nodecount) but only if not an artificial cell
118 // data (nodecount*param_size)
119 // pdata (nodecount*dparam_size) but only if dparam_size > 0 on this side.
120 // output_vindex (n_presyn) >= 0 associated with voltages -(type+1000*index) for acell
121 // output_threshold (n_real_output)
122 // netcon_pnttype (nnetcon) <=0 if a NetCon does not have a target.
123 // netcon_pntindex (nnetcon)
124 // weights (nweight)
125 // delays (nnetcon)
126 // for the nmech tml mechanisms that have a nrn_bbcore_write method
127 // type
128 // icnt
129 // dcnt
130 // int array (number specified by the nodecount nrn_bbcore_write
131 // to be interpreted by this side's nrn_bbcore_read method)
132 // double array
133 // #VectorPlay_instances, for each of these instances
134 // 4 (VecPlayContinuousType)
135 // mtype
136 // index (from Memb_list.data)
137 // vecsize
138 // yvec
139 // tvec
140 //
141 // The critical issue requiring careful attention is that a coreneuron
142 // process reads many coreneuron thread files, with the result that, although
143 // the conceptual
144 // total n_presyn is the sum of the n_presyn from each thread, as is the
145 // total number of output_gid, the number of InputPreSyn instances must
146 // be computed here from knowledge of all threads' netcon_srcgid after
147 // all threads' output_gids have been registered. We want to avoid the
148 // "individual allocation of many small objects" memory overhead by
149 // allocating a single InputPreSyn array for the entire process.
150 // For this reason cellgroup data are divided into two separate
151 // files with the first containing output_gids and netcon_srcgid which are
152 // stored in the nt.presyns array and nt.netcons array respectively
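A minimal standalone sketch of a reader for the <firstgid>_1.dat layout described above (single integers as ASCII, arrays as binary int). This is illustrative only and not part of nrn_setup.cpp; the real reader is the FileHandler-based Phase1 class, and the sketch ignores the version line and checkpoint bookkeeping that the real files carry.

// Illustrative sketch, not part of this file.
#include <cstddef>
#include <cstdio>
#include <vector>

struct Dat1Sketch {
    std::vector<int> output_gids;    // n_presyn entries; -(type+1000*index) for acell with no gid
    std::vector<int> netcon_srcgid;  // n_netcon entries; negative values as described above
};

inline bool read_dat1_sketch(const char* path, Dat1Sketch& out) {
    FILE* f = std::fopen(path, "rb");
    if (!f) {
        return false;
    }
    int n_presyn = 0;
    int n_netcon = 0;
    bool ok = std::fscanf(f, "%d\n%d\n", &n_presyn, &n_netcon) == 2;  // ASCII header
    if (ok) {
        out.output_gids.resize(n_presyn);
        out.netcon_srcgid.resize(n_netcon);
        ok = std::fread(out.output_gids.data(), sizeof(int), n_presyn, f) ==
                 static_cast<std::size_t>(n_presyn) &&
             std::fread(out.netcon_srcgid.data(), sizeof(int), n_netcon, f) ==
                 static_cast<std::size_t>(n_netcon);  // binary arrays
    }
    std::fclose(f);
    return ok;
}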
153 namespace coreneuron {
154 static OMP_Mutex mut;
155 
156 /// Vector of maps for negative presyns
157 std::vector<std::map<int, PreSyn*>> neg_gid2out;
158 /// Maps for output and input presyns
159 std::map<int, PreSyn*> gid2out;
160 std::map<int, InputPreSyn*> gid2in;
161 
162 /// InputPreSyn.nc_index_ to InputPreSyn.nc_index_ + InputPreSyn.nc_cnt_ give the NetCon*
163 std::vector<NetCon*> netcon_in_presyn_order_;
164 
165 /// Only used during setup: vector of netcon source gids
166 std::vector<int*> nrnthreads_netcon_srcgid;
167 
168 /// If a nrnthreads_netcon_srcgid is negative, we need to determine the thread
169 /// in order to use the correct neg_gid2out[tid] map
170 std::vector<std::vector<int>> nrnthreads_netcon_negsrcgid_tid;
171 
172 /* read files.dat file and distribute cellgroups to all mpi ranks */
173 void nrn_read_filesdat(int& ngrp, int*& grp, const char* filesdat) {
174  patstimtype = nrn_get_mechtype("PatternStim");
175  if (corenrn_embedded) {
176  ngrp = corenrn_embedded_nthread;
177  grp = new int[ngrp + 1];
178  (*nrn2core_group_ids_)(grp);
179  return;
180  }
181 
182  FILE* fp = fopen(filesdat, "r");
183 
184  if (!fp) {
185  nrn_fatal_error("No input file ( %s ) with nrnthreads, exiting...", filesdat);
186  }
187 
188  char version[256];
189  nrn_assert(fscanf(fp, "%s\n", version) == 1);
190  check_bbcore_write_version(version);
191 
192  int iNumFiles = 0;
193  nrn_assert(fscanf(fp, "%d\n", &iNumFiles) == 1);
194 
195  // temporary stratagem to figure out if model uses gap junctions while
196  // being backward compatible
197  if (iNumFiles == -1) {
198  nrn_assert(fscanf(fp, "%d\n", &iNumFiles) == 1);
199  nrn_have_gaps = true;
200  if (nrnmpi_myid == 0) {
201  printf("Model uses gap junctions\n");
202  }
203  }
204 
205  if (nrnmpi_numprocs > iNumFiles && nrnmpi_myid == 0) {
206  printf(
207  "Info : The number of input datasets is less than the number of ranks; some ranks will be idle!\n");
208  }
209 
210  ngrp = 0;
211  grp = new int[iNumFiles / nrnmpi_numprocs + 1];
212 
213  // iterate over gids in files.dat
214  for (int iNum = 0; iNum < iNumFiles; ++iNum) {
215  int iFile;
216 
217  nrn_assert(fscanf(fp, "%d\n", &iFile) == 1);
218  if ((iNum % nrnmpi_numprocs) == nrnmpi_myid) {
219  // A "-1" entry means that this rank should not be assigned further gid groups.
220  // It is a way to create files.dat files which deterministically assign gid groups to
221  // ranks, particularly useful for very large simulations which require load balancing.
222  if (iFile == -1) {
223  break;
224  }
225  grp[ngrp] = iFile;
226  ngrp++;
227  }
228  }
229 
230  fclose(fp);
231 }
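The loop above distributes files.dat entries to ranks round-robin, with a "-1" entry stopping further assignment to the rank it lands on. Below is a standalone sketch of that policy, not part of this file; for example, with datasets {10, 20, 30, 40, 50} and 2 ranks, rank 0 receives {10, 30, 50} and rank 1 receives {20, 40}.

// Illustrative sketch, not part of this file (<vector> is already included above).
inline std::vector<int> groups_for_rank_sketch(const std::vector<int>& datasets,
                                               int myid,
                                               int nranks) {
    std::vector<int> mine;
    for (std::size_t i = 0; i < datasets.size(); ++i) {
        if (static_cast<int>(i % nranks) == myid) {
            if (datasets[i] == -1) {
                break;  // "-1" means: no further gid groups for this rank
            }
            mine.push_back(datasets[i]);
        }
    }
    return mine;
}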
232 
233 void netpar_tid_gid2ps(int tid, int gid, PreSyn** ps, InputPreSyn** psi) {
234  /// for gid < 0 returns the PreSyn* in the thread (tid) specific map.
235  *ps = nullptr;
236  *psi = nullptr;
237 
238  if (gid >= 0) {
239  auto gid2out_it = gid2out.find(gid);
240  if (gid2out_it != gid2out.end()) {
241  *ps = gid2out_it->second;
242  } else {
243  auto gid2in_it = gid2in.find(gid);
244  if (gid2in_it != gid2in.end()) {
245  *psi = gid2in_it->second;
246  }
247  }
248  } else {
249  auto gid2out_it = neg_gid2out[tid].find(gid);
250  if (gid2out_it != neg_gid2out[tid].end()) {
251  *ps = gid2out_it->second;
252  }
253  }
254 }
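A hypothetical usage sketch of netpar_tid_gid2ps() (not part of this file): a source gid resolves to at most one of a PreSyn owned by this process (looked up in the thread-specific neg_gid2out[tid] map when gid < 0), a process-wide InputPreSyn, or nothing.

// Illustrative sketch, not part of this file.
enum class SrcKindSketch { OutputPreSyn, InputPreSyn, None };

inline SrcKindSketch classify_source_sketch(int tid, int gid) {
    PreSyn* ps = nullptr;
    InputPreSyn* psi = nullptr;
    netpar_tid_gid2ps(tid, gid, &ps, &psi);
    if (ps) {
        return SrcKindSketch::OutputPreSyn;  // source cell owned by this process
    }
    if (psi) {
        return SrcKindSketch::InputPreSyn;   // spikes for this gid arrive from another rank
    }
    return SrcKindSketch::None;              // NetCon without a source
}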
255 
256 void determine_inputpresyn() {
257  // allocate the process wide InputPreSyn array
258  // all the output_gid have been registered and associated with PreSyn.
259  // now count the needed InputPreSyn by filling the netpar::gid2in map
260  gid2in.clear();
261 
262  // now have to fill the new table
263  // do not need to worry about negative gid overlap since only use
264  // it to search for PreSyn in this thread.
265 
266  std::vector<InputPreSyn*> inputpresyn_;
267 
268  for (int ith = 0; ith < nrn_nthread; ++ith) {
269  NrnThread& nt = nrn_threads[ith];
270  // associate gid with InputPreSyn and increase PreSyn and InputPreSyn count
271  nt.n_input_presyn = 0;
272  // if single thread or file transfer then definitely empty.
273  std::vector<int>& negsrcgid_tid = nrnthreads_netcon_negsrcgid_tid[ith];
274  size_t i_tid = 0;
275  for (int i = 0; i < nt.n_netcon; ++i) {
276  int gid = nrnthreads_netcon_srcgid[ith][i];
277  if (gid >= 0) {
278  /// If PreSyn or InputPreSyn is already in the map
279  auto gid2out_it = gid2out.find(gid);
280  if (gid2out_it != gid2out.end()) {
281  /// Increase PreSyn count
282  ++gid2out_it->second->nc_cnt_;
283  continue;
284  }
285  auto gid2in_it = gid2in.find(gid);
286  if (gid2in_it != gid2in.end()) {
287  /// Increase InputPreSyn count
288  ++gid2in_it->second->nc_cnt_;
289  continue;
290  }
291 
292  /// Create InputPreSyn and increase its count
293  InputPreSyn* psi = new InputPreSyn;
294  ++psi->nc_cnt_;
295  gid2in[gid] = psi;
296  inputpresyn_.push_back(psi);
297  ++nt.n_input_presyn;
298  } else {
299  int tid = nt.id;
300  if (!negsrcgid_tid.empty()) {
301  tid = negsrcgid_tid[i_tid++];
302  }
303  auto gid2out_it = neg_gid2out[tid].find(gid);
304  if (gid2out_it != neg_gid2out[tid].end()) {
305  /// Increase negative PreSyn count
306  ++gid2out_it->second->nc_cnt_;
307  }
308  }
309  }
310  }
311 
312  // now, we can opportunistically create the NetCon* pointer array
313  // to avoid the memory overhead of a
314  // "large number of small array allocations" by
315  // counting the number of NetCons each PreSyn and InputPreSyn point to.
316  // Conceivably the nt.netcons could become a process global array
317  // in which case the NetCon* pointer array could become an integer index
318  // array. More speculatively, the index array could be eliminated itself
319  // if the process global NetCon array were ordered properly but that
320  // would interleave NetCon from different threads. Not a problem for
321  // serial threads but the reordering would propagate to nt.pntprocs
322  // if the NetCon data pointers are also replaced by integer indices.
323 
324  // First, allocate the pointer array.
325  int n_nc = 0;
326  for (int ith = 0; ith < nrn_nthread; ++ith) {
327  n_nc += nrn_threads[ith].n_netcon;
328  }
329  netcon_in_presyn_order_.resize(n_nc);
330  n_nc = 0;
331 
332  // fill the indices with the offset values and reset the nc_cnt_
333  // such that we use the nc_cnt_ in the following loop to assign the NetCon
334  // to the right place
335  // for PreSyn
336  int offset = 0;
337  for (int ith = 0; ith < nrn_nthread; ++ith) {
338  NrnThread& nt = nrn_threads[ith];
339  for (int i = 0; i < nt.n_presyn; ++i) {
340  PreSyn& ps = nt.presyns[i];
341  ps.nc_index_ = offset;
342  offset += ps.nc_cnt_;
343  ps.nc_cnt_ = 0;
344  }
345  }
346  // for InputPreSyn
347  for (auto psi: inputpresyn_) {
348  psi->nc_index_ = offset;
349  offset += psi->nc_cnt_;
350  psi->nc_cnt_ = 0;
351  }
352 
353  inputpresyn_.clear();
354 
355  // with gid to InputPreSyn and PreSyn maps we can setup the multisend
356  // target lists.
357  if (use_multisend_) {
358 #if NRN_MULTISEND
359  nrn_multisend_setup();
360 #endif
361  }
362 
363  // fill the netcon_in_presyn_order and recompute nc_cnt_
364  // note that not all netcon_in_presyn will be filled if there are netcon
365  // with no presyn (ie. nrnthreads_netcon_srcgid[nt.id][i] = -1) but that is ok since they are
366  // only used via ps.nc_index_ and ps.nc_cnt_;
367  for (int ith = 0; ith < nrn_nthread; ++ith) {
368  NrnThread& nt = nrn_threads[ith];
369  // if single thread or file transfer then definitely empty.
370  std::vector<int>& negsrcgid_tid = nrnthreads_netcon_negsrcgid_tid[ith];
371  size_t i_tid = 0;
372  for (int i = 0; i < nt.n_netcon; ++i) {
373  NetCon* nc = nt.netcons + i;
374  int gid = nrnthreads_netcon_srcgid[ith][i];
375  int tid = ith;
376  if (!negsrcgid_tid.empty() && gid < -1) {
377  tid = negsrcgid_tid[i_tid++];
378  }
379  PreSyn* ps;
380  InputPreSyn* psi;
381  netpar_tid_gid2ps(tid, gid, &ps, &psi);
382  if (ps) {
383  netcon_in_presyn_order_[ps->nc_index_ + ps->nc_cnt_] = nc;
384  ++ps->nc_cnt_;
385  ++n_nc;
386  } else if (psi) {
387  netcon_in_presyn_order_[psi->nc_index_ + psi->nc_cnt_] = nc;
388  ++psi->nc_cnt_;
389  ++n_nc;
390  }
391  }
392  }
393 
394  /// Resize the vector to the actual number of netcons put in it
395  netcon_in_presyn_order_.resize(n_nc);
396 }
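The function above uses a two-pass offset/fill scheme: count NetCons per source (nc_cnt_), convert the counts into offsets (nc_index_) while resetting the counts, then place each NetCon at nc_index_ + nc_cnt_. This is the classic counting-sort bucket fill; a minimal standalone sketch, not part of this file:

// Illustrative sketch, not part of this file: order item indices by bucket
// (<vector> is already included above).
inline std::vector<int> bucket_fill_sketch(const std::vector<int>& item_to_bucket, int nbuckets) {
    std::vector<int> count(nbuckets, 0);
    for (int b: item_to_bucket) {
        ++count[b];  // pass 1: count items per bucket (like nc_cnt_)
    }
    std::vector<int> offset(nbuckets, 0);
    int running = 0;
    for (int b = 0; b < nbuckets; ++b) {
        offset[b] = running;  // like ps.nc_index_
        running += count[b];
        count[b] = 0;  // reset so pass 2 can reuse it as a per-bucket cursor
    }
    std::vector<int> ordered(item_to_bucket.size());
    for (std::size_t i = 0; i < item_to_bucket.size(); ++i) {
        const int b = item_to_bucket[i];
        ordered[offset[b] + count[b]++] = static_cast<int>(i);  // like netcon_in_presyn_order_
    }
    return ordered;
}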
397 
398 /// Clean up
399 void nrn_setup_cleanup() {
400  for (int ith = 0; ith < nrn_nthread; ++ith) {
401  if (nrnthreads_netcon_srcgid[ith])
402  delete[] nrnthreads_netcon_srcgid[ith];
403  }
404  nrnthreads_netcon_srcgid.clear();
405  nrnthreads_netcon_negsrcgid_tid.clear();
406  neg_gid2out.clear();
407 }
408 
409 void nrn_setup(const char* filesdat,
410  bool is_mapping_needed,
411  CheckPoints& checkPoints,
412  bool run_setup_cleanup,
413  const char* datpath,
414  const char* restore_path,
415  double* mindelay) {
416  double time = nrn_wtime();
417 
418  int ngroup;
419  int* gidgroups;
420  nrn_read_filesdat(ngroup, gidgroups, filesdat);
421  UserParams userParams(ngroup,
422  gidgroups,
423  datpath,
424  strlen(restore_path) == 0 ? datpath : restore_path,
425  checkPoints);
426 
427 
428  // temporary bug work around. If any process has multiple threads, no
429  // process can have a single thread. So, for now, if one thread, make two.
430  // Fortunately, empty threads work fine.
431  // Allocate NrnThread* nrn_threads of size ngroup (minimum 2)
432  // Note that rank with 0 dataset/cellgroup works fine
433  nrn_threads_create(userParams.ngroup <= 1 ? 2 : userParams.ngroup);
434 
435  // from nrn_has_net_event create pnttype2presyn for use in phase2.
436  auto& memb_func = corenrn.get_memb_funcs();
437  auto& pnttype2presyn = corenrn.get_pnttype2presyn();
439  pnttype2presyn.clear();
440  pnttype2presyn.resize(memb_func.size(), -1);
441  for (size_t i = 0; i < nrn_has_net_event_.size(); ++i) {
442  pnttype2presyn[nrn_has_net_event_[i]] = i;
443  }
444 
446 
447  if (nrn_nthread > 1) {
448  // NetCvode construction assumed one thread. Need nrn_nthread instances
449  // of NetCvodeThreadData. Here since possible checkpoint restore of
450  // tqueue at end of phase2.
451  nrn_p_construct();
452  }
453 
454  if (use_solve_interleave) {
455  create_interleave_info();
456  }
457 
458  /// Reserve vector of maps of size ngroup for negative gid-s
459  /// std::vector< std::map<int, PreSyn*> > neg_gid2out;
460  neg_gid2out.resize(userParams.ngroup);
461 
462  // bug fix. gid2out is cumulative over all threads and so we do not
463  // know how many there are until after phase1.
464  // A process's complete set of output gids and allocation of each thread's
465  // nt.presyns and nt.netcons arrays.
466  // Generates the gid2out map which is needed
467  // to later count the required number of InputPreSyn
468  /// gid2out - map of output presyn-s
469  /// std::map<int, PreSyn*> gid2out;
470  gid2out.clear();
471 
472  nrnthreads_netcon_srcgid.resize(nrn_nthread);
473  for (int i = 0; i < nrn_nthread; ++i)
474  nrnthreads_netcon_srcgid[i] = nullptr;
475 
476  // Gap junctions used to be done first in the sense of reading files
477  // and calling gap_mpi_setup. But during phase2, gap_thread_setup and
478  // gap_indices_permute were called after NrnThread.data was in its final
479  // layout and mechanism permutation was determined. This is no longer
480  // ideal as it necessitates keeping setup_info_ in existence to the end
481  // of phase2. So gap junction setup is deferred to after phase2.
482 
484  if (corenrn_file_mode) {
485  coreneuron::phase_wrapper<coreneuron::phase::one>(userParams, !corenrn_file_mode);
486  } else {
487  nrn_multithread_job([](NrnThread* n) {
488  Phase1 p1{n->id};
489  p1.populate(*n, mut);
490  });
491  }
492 
493  // from the gid2out map and the nrnthreads_netcon_srcgid array,
494  // fill the gid2in, and from the number of entries,
495  // allocate the process wide InputPreSyn array
496  determine_inputpresyn();
497 
498  // read the rest of the gidgroup's data and complete the setup for each
499  // thread.
500  /* nrn_multithread_job supports serial, pthread, and openmp. */
501  coreneuron::phase_wrapper<coreneuron::phase::two>(userParams, !corenrn_file_mode);
502 
503  // gap junctions
504  // Gaps are done after phase2, in order to use layout and permutation
505  // information via calls to legacy_index2pointer.
506  if (nrn_have_gaps) {
508  if (!corenrn_embedded) {
510  coreneuron::phase_wrapper<coreneuron::gap>(userParams);
511  } else {
512  nrn_partrans::setup_info_ = (*nrn2core_get_partrans_setup_info_)(userParams.ngroup,
513  nrn_nthread,
514  sizeof(sgid_t));
515  }
516 
519 
520  // Whether allocated in NEURON or here, delete here.
521  delete[] nrn_partrans::setup_info_;
522  nrn_partrans::setup_info_ = nullptr;
523  }
524 
525  if (is_mapping_needed)
526  coreneuron::phase_wrapper<coreneuron::phase::three>(userParams, !corenrn_file_mode);
527 
528  *mindelay = set_mindelay(*mindelay);
529 
530  if (run_setup_cleanup) // if run_setup_cleanup==false, user must call nrn_setup_cleanup() later
531  nrn_setup_cleanup();
532 
533 #if INTERLEAVE_DEBUG
534  // mk_cell_indices debug code is supposed to be used with cell-per-core permutations
536  mk_cell_indices();
537  }
538 #endif
539 
540  /// Allocate memory for fast_imem calculation
541  nrn_fast_imem_alloc();
542 
543  /// Generally, tables depend on a few parameters, and if those parameters change,
544  /// then the table needs to be recomputed. This is obviously important in NEURON
545  /// since the user can change those parameters at any time. However, there is no
546  /// such example for CoreNEURON, so it is not clear what this looks like in that context.
547  /// This boils down to setting up a function pointer to the function _check_table_thread(),
548  /// which is only executed by StochKV.c.
549  nrn_mk_table_check(); // was done in nrn_thread_memblist_setup in multicore.c
550 
551  size_t model_size_bytes;
552 
554  if (corenrn_param.model_stats) {
555  model_size_bytes = model_size(true);
556  } else {
557  model_size_bytes = model_size(false);
558  }
559 
560  if (nrnmpi_myid == 0 && !corenrn_param.is_quiet()) {
561  printf(" Setup Done : %.2lf seconds \n", nrn_wtime() - time);
562 
563  if (model_size_bytes < 1024) {
564  printf(" Model size : %ld bytes\n", model_size_bytes);
565  } else if (model_size_bytes < 1024 * 1024) {
566  printf(" Model size : %.2lf kB\n", model_size_bytes / 1024.);
567  } else if (model_size_bytes < 1024 * 1024 * 1024) {
568  printf(" Model size : %.2lf MB\n", model_size_bytes / (1024. * 1024.));
569  } else {
570  printf(" Model size : %.2lf GB\n", model_size_bytes / (1024. * 1024. * 1024.));
571  }
572  }
573 
574  delete[] userParams.gidgroups;
575 }
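The model-size report at the end of nrn_setup() uses fixed 1024-based thresholds (e.g. 3221225472 bytes prints as 3.00 GB). A small helper sketch (not part of this file) capturing the same formatting, using %zu for the size_t argument:

// Illustrative sketch, not part of this file.
inline void print_model_size_sketch(size_t model_size_bytes) {
    if (model_size_bytes < 1024) {
        printf(" Model size : %zu bytes\n", model_size_bytes);
    } else if (model_size_bytes < 1024 * 1024) {
        printf(" Model size : %.2lf kB\n", model_size_bytes / 1024.);
    } else if (model_size_bytes < 1024 * 1024 * 1024) {
        printf(" Model size : %.2lf MB\n", model_size_bytes / (1024. * 1024.));
    } else {
        printf(" Model size : %.2lf GB\n", model_size_bytes / (1024. * 1024. * 1024.));
    }
}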
576 
577 void setup_ThreadData(NrnThread& nt) {
578  for (NrnThreadMembList* tml = nt.tml; tml; tml = tml->next) {
579  Memb_func& mf = corenrn.get_memb_func(tml->index);
580  Memb_list* ml = tml->ml;
581  if (mf.thread_size_) {
583  if (mf.thread_mem_init_) {
584  {
585  const std::lock_guard<OMP_Mutex> lock(mut);
586  (*mf.thread_mem_init_)(ml->_thread);
587  }
588  }
589  } else {
590  ml->_thread = nullptr;
591  }
592  }
593 }
594 
595 void read_phasegap(NrnThread& nt, UserParams& userParams) {
596  auto& F = userParams.file_reader[nt.id];
597  if (F.fail()) {
598  return;
599  }
600 
601  F.checkpoint(0);
602 
603  int sidt_size = F.read_int();
604  assert(sidt_size == int(sizeof(sgid_t)));
605  std::size_t ntar = F.read_int();
606  std::size_t nsrc = F.read_int();
607 
608  auto& si = nrn_partrans::setup_info_[nt.id];
609  si.src_sid.resize(nsrc);
610  si.src_type.resize(nsrc);
611  si.src_index.resize(nsrc);
612  if (nsrc) {
613  F.read_array<sgid_t>(si.src_sid.data(), nsrc);
614  F.read_array<int>(si.src_type.data(), nsrc);
615  F.read_array<int>(si.src_index.data(), nsrc);
616  }
617 
618  si.tar_sid.resize(ntar);
619  si.tar_type.resize(ntar);
620  si.tar_index.resize(ntar);
621  if (ntar) {
622  F.read_array<sgid_t>(si.tar_sid.data(), ntar);
623  F.read_array<int>(si.tar_type.data(), ntar);
624  F.read_array<int>(si.tar_index.data(), ntar);
625  }
626 
627 #if CORENRN_DEBUG
628  printf("%d read_phasegap tid=%d nsrc=%zu ntar=%zu\n", nrnmpi_myid, nt.id, nsrc, ntar);
629  for (int i = 0; i < nsrc; ++i) {
630  printf("src %zu %d %d\n", size_t(si.src_sid[i]), si.src_type[i], si.src_index[i]);
631  }
632  for (int i = 0; i < ntar; ++i) {
633  printf("tar %zu %d %d\n", size_t(si.tar_sid[i]), si.tar_type[i], si.tar_index[i]);
634  }
635 #endif
636 }
637 
638 // This function is related to nrn_dblpntr2nrncore in NEURON and determines which values should
639 // be transferred from CoreNEURON. Types correspond to the value to be transferred, based on the
640 // mech_type enum or a non-artificial cell mechanism type.
641 // take into account alignment, layout, permutation
642 // only voltage, i_membrane_ or mechanism data index allowed. (mtype 0 means time)
643 double* legacy_index2pointer(int mtype, int index, NrnThread& nt) {
644  if (mtype == voltage) { // voltage
645  int ix = index; // relative to _actual_v
646  nrn_assert((ix >= 0) && (ix < nt.end));
647  if (nt._permute) {
648  node_permute(&ix, 1, nt._permute);
649  }
650  return nt._actual_v + ix;
651  } else if (mtype == i_membrane_) { // membrane current from fast_imem calculation
652  int ix = index; // relative to nrn_fast_imem->nrn_sav_rhs
653  nrn_assert((ix >= 0) && (ix < nt.end));
654  if (nt._permute) {
655  node_permute(&ix, 1, nt._permute);
656  }
657  return nt.nrn_fast_imem->nrn_sav_rhs + ix;
658  } else if (mtype > 0 && mtype < static_cast<int>(corenrn.get_memb_funcs().size())) { //
659  Memb_list* ml = nt._ml_list[mtype];
660  nrn_assert(ml);
661 
662  const std::vector<int>& array_dims = corenrn.get_array_dims()[mtype];
663  int padded_node_count = nrn_soa_padded_size(ml->nodecount, Layout::SoA);
664 
665  auto soaos_index = legacy2soaos_index(index, array_dims);
666  auto cnrn_index =
667  soaos2cnrn_index(soaos_index, array_dims, padded_node_count, ml->_permute);
668 
669  return ml->data + cnrn_index;
670  } else if (mtype == 0) { // time
671  return &nt._t;
672  } else {
673  printf("legacy_index2pointer does not handle mtype=%d\n", mtype);
674  nrn_assert(0);
675  }
676  return nullptr;
677 }
678 
679 // from i to (icnt, isz)
680 void nrn_inverse_i_layout(int i, int& icnt, int cnt, int& isz, int sz, int layout) {
681  if (layout == Layout::AoS) {
682  icnt = i / sz;
683  isz = i % sz;
684  } else if (layout == Layout::SoA) {
685  int padded_cnt = nrn_soa_padded_size(cnt, layout);
686  icnt = i % padded_cnt;
687  isz = i / padded_cnt;
688  } else {
689  assert(0);
690  }
691 }
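nrn_inverse_i_layout() above inverts the flat-index computation of the two memory layouts: AoS stores the sz variables of one instance contiguously, while SoA stores each variable in its own column padded to nrn_soa_padded_size(cnt, layout) entries. A sketch of the forward mapping, not part of this file:

// Illustrative sketch, not part of this file: from (icnt, isz) to the flat index i.
inline int forward_i_layout_sketch(int icnt, int cnt, int isz, int sz, int layout) {
    if (layout == Layout::AoS) {
        return icnt * sz + isz;  // instance-major
    } else if (layout == Layout::SoA) {
        int padded_cnt = nrn_soa_padded_size(cnt, layout);
        return isz * padded_cnt + icnt;  // variable-major, with padded columns
    }
    assert(0);
    return -1;
}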
692 
693 /**
694  * Cleanup global ion map created during mechanism registration
695  *
696  * In case of coreneuron standalone execution nrn_ion_global_map
697  * can be deleted at the end of execution. But in case embedded
698  * run via neuron, mechanisms are registered only once i.e. during
699  * first call to coreneuron. This is why we call cleanup only in
700  * case of standalone coreneuron execution via nrniv-core or
701  * special-core.
702  *
703  * @todo coreneuron should have finalise callback which can be
704  * called from NEURON for final memory cleanup including global
705  * state like registered mechanisms and ions map.
706  */
707 void nrn_cleanup_ion_map() {
708  for (int i = 0; i < nrn_ion_global_map_size; i++) {
710  }
712  nrn_ion_global_map = nullptr;
714 }
715 
716 void delete_fornetcon_info(NrnThread& nt) {
717  delete[] std::exchange(nt._fornetcon_perm_indices, nullptr);
718  delete[] std::exchange(nt._fornetcon_weight_perm, nullptr);
719 }
720 
721 /* nrn_threads_free() presumes all NrnThread and NrnThreadMembList data is
722  * allocated with malloc(). This is not the case here, so let's try and fix
723  * things up first. */
724 
725 void nrn_cleanup() {
726  clear_event_queue(); // delete left-over TQItem
727  for (auto psi: gid2in) {
728  delete psi.second;
729  }
730  gid2in.clear();
731  gid2out.clear();
732 
733  // clean nrnthread_chkpnt
734  if (nrnthread_chkpnt) {
735  delete[] nrnthread_chkpnt;
736  nrnthread_chkpnt = nullptr;
737  }
738 
739  // clean NrnThreads
740  for (int it = 0; it < nrn_nthread; ++it) {
741  NrnThread* nt = nrn_threads + it;
742  NrnThreadMembList* next_tml = nullptr;
745  for (NrnThreadMembList* tml = nt->tml; tml; tml = next_tml) {
746  Memb_list* ml = tml->ml;
747 
748  mod_f_t s = corenrn.get_memb_func(tml->index).destructor;
749  if (s) {
750  (*s)(nt, ml, tml->index);
751  }
752 
753  // Moved from below as priv_dtor is now deleting the RANDOM streams,
754  // and at this moment need an undeleted pdata.
755  // Destroy the global variables struct allocated in nrn_init
756  if (auto* const priv_dtor = corenrn.get_memb_func(tml->index).private_destructor) {
757  (*priv_dtor)(nt, ml, tml->index);
758  assert(!ml->instance);
759  assert(!ml->global_variables);
760  assert(ml->global_variables_size == 0);
761  }
762 
763  ml->data = nullptr; // this was pointing into memory owned by nt
764  free_memory(ml->pdata);
765  ml->pdata = nullptr;
766  free_memory(ml->nodeindices);
767  ml->nodeindices = nullptr;
768  if (ml->_permute) {
769  delete[] ml->_permute;
770  ml->_permute = nullptr;
771  }
772 
773  if (ml->_thread) {
774  free_memory(ml->_thread);
775  ml->_thread = nullptr;
776  }
777 
778  NetReceiveBuffer_t* nrb = ml->_net_receive_buffer;
779  if (nrb) {
780  if (nrb->_size) {
781  free_memory(nrb->_pnt_index);
783  free_memory(nrb->_nrb_t);
784  free_memory(nrb->_nrb_flag);
785  free_memory(nrb->_displ);
786  free_memory(nrb->_nrb_index);
787  }
788  free_memory(nrb);
789  ml->_net_receive_buffer = nullptr;
790  }
791 
792  NetSendBuffer_t* nsb = ml->_net_send_buffer;
793  if (nsb) {
794  delete nsb;
795  ml->_net_send_buffer = nullptr;
796  }
797 
798  if (tml->dependencies)
799  free(tml->dependencies);
800 
801  next_tml = tml->next;
802  free_memory(tml->ml);
803  free_memory(tml);
804  }
805 
806  nt->_actual_rhs = nullptr;
807  nt->_actual_d = nullptr;
808  nt->_actual_a = nullptr;
809  nt->_actual_b = nullptr;
810 
812  nt->_v_parent_index = nullptr;
813 
814  free_memory(nt->_data);
815  nt->_data = nullptr;
816 
817  free(nt->_idata);
818  nt->_idata = nullptr;
819 
820  free_memory(nt->_vdata);
821  nt->_vdata = nullptr;
822 
823  if (nt->_permute) {
824  delete[] nt->_permute;
825  nt->_permute = nullptr;
826  }
827 
828  if (nt->presyns_helper) {
829  free_memory(nt->presyns_helper);
830  nt->presyns_helper = nullptr;
831  }
832 
833  delete[] std::exchange(nt->pntprocs, nullptr);
834  delete[] std::exchange(nt->presyns, nullptr);
835 
836  if (nt->pnt2presyn_ix) {
837  for (size_t i = 0; i < corenrn.get_has_net_event().size(); ++i) {
838  if (nt->pnt2presyn_ix[i]) {
839  free(nt->pnt2presyn_ix[i]);
840  }
841  }
842  free(nt->pnt2presyn_ix);
843  }
844 
845  if (nt->netcons) {
846  delete[] nt->netcons;
847  nt->netcons = nullptr;
848  }
849 
850  if (nt->weights) {
851  free_memory(nt->weights);
852  nt->weights = nullptr;
853  }
854 
855  if (nt->_shadow_rhs) {
856  free_memory(nt->_shadow_rhs);
857  nt->_shadow_rhs = nullptr;
858  }
859 
860  if (nt->_shadow_d) {
861  free_memory(nt->_shadow_d);
862  nt->_shadow_d = nullptr;
863  }
864 
865  if (nt->_net_send_buffer_size) {
866  free_memory(nt->_net_send_buffer);
867  nt->_net_send_buffer = nullptr;
868  nt->_net_send_buffer_size = 0;
869  }
870 
871  if (nt->_watch_types) {
872  free(nt->_watch_types);
873  nt->_watch_types = nullptr;
874  }
875 
876  // mapping information is available only for non-empty NrnThread
877  if (nt->mapping && nt->ncell) {
878  delete ((NrnThreadMappingInfo*) nt->mapping);
879  }
880 
881  free_memory(nt->_ml_list);
882 
883  if (nt->nrn_fast_imem) {
884  fast_imem_free();
885  }
886  }
887 
888 #if NRN_MULTISEND
889  nrn_multisend_cleanup();
890 #endif
891 
892  netcon_in_presyn_order_.clear();
893 
895 
896  if (!corenrn.get_pnttype2presyn().empty()) {
897  corenrn.get_pnttype2presyn().clear();
898  }
899 
901 
903 }
904 
905 void delete_trajectory_requests(NrnThread& nt) {
906  if (nt.trajec_requests) {
907  TrajectoryRequests* tr = nt.trajec_requests;
908  if (tr->n_trajec) {
909  delete[] tr->vpr;
910  if (tr->scatter) {
911  delete[] tr->scatter;
912  }
913  if (tr->varrays) {
914  delete[] tr->varrays;
915  }
916  delete[] tr->gather;
917  }
918  delete nt.trajec_requests;
919  nt.trajec_requests = nullptr;
920  }
921 }
922 
923 void read_phase1(NrnThread& nt, UserParams& userParams) {
924  Phase1 p1{userParams.file_reader[nt.id]};
925 
926  // Protect gid2in, gid2out and neg_gid2out
927  p1.populate(nt, mut);
928 }
929 
930 void read_phase2(NrnThread& nt, UserParams& userParams) {
931  Phase2 p2;
932  if (corenrn_embedded) {
933  p2.read_direct(nt.id, nt);
934  } else {
935  p2.read_file(userParams.file_reader[nt.id], nt);
936  }
937  p2.populate(nt, userParams);
938 }
939 
940 /** read mapping information for neurons */
941 void read_phase3(NrnThread& nt, UserParams& userParams) {
942  /** mapping information for all neurons in single NrnThread */
943  NrnThreadMappingInfo* ntmapping = new NrnThreadMappingInfo();
944 
945  Phase3 p3;
946  if (corenrn_embedded) {
947  p3.read_direct(ntmapping);
948  } else {
949  auto& F = userParams.file_reader[nt.id];
950  F.restore_checkpoint();
951  p3.read_file(F, ntmapping);
952  }
953 
954  // make sure the number of cells matches the mapping size
955  nrn_assert((int) ntmapping->size() == nt.ncell);
956 
957  // set pointer in NrnThread
958  nt.mapping = (void*) ntmapping;
959  nt.summation_report_handler_ = std::make_unique<SummationReportMapping>();
960 }
961 
962 /* Returns the size of the dynamically allocated memory for NrnThreadMembList
963  * Includes:
964  * - Size of NrnThreadMembList
965  * - Size of Memb_list
966  * - Size of nodeindices
967  * - Size of _permute
968  * - Size of _thread
969  * - Size of NetReceive and NetSend Buffers
970  * - Size of int variables
971  * - Size of double variables (If include_data is enabled. Those variables are already counted
972  * since they point to nt->_data.)
973  */
974 size_t memb_list_size(NrnThreadMembList* tml, bool include_data) {
975  size_t nbyte = sizeof(NrnThreadMembList) + sizeof(Memb_list);
976  nbyte += tml->ml->nodecount * sizeof(int);
977  if (tml->ml->_permute) {
978  nbyte += tml->ml->nodecount * sizeof(int);
979  }
980  if (tml->ml->_thread) {
981  Memb_func& mf = corenrn.get_memb_func(tml->index);
982  nbyte += mf.thread_size_ * sizeof(ThreadDatum);
983  }
984  if (tml->ml->_net_receive_buffer) {
985  nbyte += sizeof(NetReceiveBuffer_t) + tml->ml->_net_receive_buffer->size_of_object();
986  }
987  if (tml->ml->_net_send_buffer) {
988  nbyte += sizeof(NetSendBuffer_t) + tml->ml->_net_send_buffer->size_of_object();
989  }
990  if (include_data) {
991  nbyte += corenrn.get_prop_param_size()[tml->index] * tml->ml->nodecount * sizeof(double);
992  }
993  nbyte += corenrn.get_prop_dparam_size()[tml->index] * tml->ml->nodecount * sizeof(Datum);
994 #ifdef DEBUG
995  int i = tml->index;
996  printf("%s %d psize=%d ppsize=%d cnt=%d nbyte=%ld\n",
997  corenrn.get_memb_func(i).sym,
998  i,
999  corenrn.get_prop_param_size()[i],
1000  corenrn.get_prop_dparam_size()[i],
1001  tml->ml->nodecount,
1002  nbyte);
1003 #endif
1004  return nbyte;
1005 }
1006 
1007 /// Approximate count of number of bytes for the gid2out map
1008 size_t output_presyn_size(void) {
1009  if (gid2out.empty()) {
1010  return 0;
1011  }
1012  size_t nbyte = sizeof(gid2out) + sizeof(int) * gid2out.size() +
1013  sizeof(PreSyn*) * gid2out.size();
1014 #ifdef DEBUG
1015  printf(" gid2out table bytes=~%ld size=%ld\n", nbyte, gid2out.size());
1016 #endif
1017  return nbyte;
1018 }
1019 
1020 size_t input_presyn_size(void) {
1021  if (gid2in.empty()) {
1022  return 0;
1023  }
1024  size_t nbyte = sizeof(gid2in) + sizeof(int) * gid2in.size() +
1025  sizeof(InputPreSyn*) * gid2in.size();
1026 #ifdef DEBUG
1027  printf(" gid2in table bytes=~%ld size=%ld\n", nbyte, gid2in.size());
1028 #endif
1029  return nbyte;
1030 }
1031 
1032 size_t model_size(bool detailed_report) {
1033  long nbyte = 0;
1034  size_t sz_nrnThread = sizeof(NrnThread);
1035  size_t sz_presyn = sizeof(PreSyn);
1036  size_t sz_input_presyn = sizeof(InputPreSyn);
1037  size_t sz_netcon = sizeof(NetCon);
1038  size_t sz_pntproc = sizeof(Point_process);
1039  size_t nccnt = 0;
1040 
1041  std::vector<long> size_data(13, 0);
1042  std::vector<long> global_size_data_min(13, 0);
1043  std::vector<long> global_size_data_max(13, 0);
1044  std::vector<long> global_size_data_sum(13, 0);
1045  std::vector<float> global_size_data_avg(13, 0.0);
1046 
1047  for (int i = 0; i < nrn_nthread; ++i) {
1048  NrnThread& nt = nrn_threads[i];
1049  size_t nb_nt = 0; // per thread
1050  nccnt += nt.n_netcon;
1051 
1052  // Memb_list size
1053  int nmech = 0;
1054  for (auto tml = nt.tml; tml; tml = tml->next) {
1055  nb_nt += memb_list_size(tml, false);
1056  ++nmech;
1057  }
1058 
1059  // basic thread size includes mechanism data and G*V=I matrix
1060  nb_nt += sz_nrnThread;
1061  nb_nt += nt._ndata * sizeof(double) + nt._nidata * sizeof(int) + nt._nvdata * sizeof(void*);
1062  nb_nt += nt.end * sizeof(int); // _v_parent_index
1063 
1064  // network connectivity
1065  nb_nt += nt.n_pntproc * sz_pntproc + nt.n_netcon * sz_netcon + nt.n_presyn * sz_presyn +
1066  nt.n_input_presyn * sz_input_presyn + nt.n_weight * sizeof(double);
1067  nbyte += nb_nt;
1068 
1069 #ifdef DEBUG
1070  printf("ncell=%d end=%d nmech=%d\n", nt.ncell, nt.end, nmech);
1071  printf("ndata=%ld nidata=%ld nvdata=%ld\n", nt._ndata, nt._nidata, nt._nvdata);
1072  printf("nbyte so far %ld\n", nb_nt);
1073  printf("n_presyn = %d sz=%ld nbyte=%ld\n", nt.n_presyn, sz_presyn, nt.n_presyn * sz_presyn);
1074  printf("n_input_presyn = %d sz=%ld nbyte=%ld\n",
1075  nt.n_input_presyn,
1076  sz_input_presyn,
1077  nt.n_input_presyn * sz_input_presyn);
1078  printf("n_pntproc=%d sz=%ld nbyte=%ld\n",
1079  nt.n_pntproc,
1080  sz_pntproc,
1081  nt.n_pntproc * sz_pntproc);
1082  printf("n_netcon=%d sz=%ld nbyte=%ld\n", nt.n_netcon, sz_netcon, nt.n_netcon * sz_netcon);
1083  printf("n_weight = %d\n", nt.n_weight);
1084 
1085  printf("%d thread %d total bytes %ld\n", nrnmpi_myid, i, nb_nt);
1086 #endif
1087 
1088  if (detailed_report) {
1089  size_data[0] += nt.ncell;
1090  size_data[1] += nt.end;
1091  size_data[2] += nmech;
1092  size_data[3] += nt._ndata;
1093  size_data[4] += nt._nidata;
1094  size_data[5] += nt._nvdata;
1095  size_data[6] += nt.n_presyn;
1096  size_data[7] += nt.n_input_presyn;
1097  size_data[8] += nt.n_pntproc;
1098  size_data[9] += nt.n_netcon;
1099  size_data[10] += nt.n_weight;
1100  size_data[11] += nb_nt;
1101  }
1102  }
1103 
1104  nbyte += nccnt * sizeof(NetCon*);
1105  nbyte += output_presyn_size();
1106  nbyte += input_presyn_size();
1107 
1108  nbyte += nrnran123_instance_count() * nrnran123_state_size();
1109 
1110 #ifdef DEBUG
1111  printf("%d netcon pointers %ld nbyte=%ld\n", nrnmpi_myid, nccnt, nccnt * sizeof(NetCon*));
1112  printf("nrnran123 size=%ld cnt=%ld nbyte=%ld\n",
1113  nrnran123_state_size(),
1114  nrnran123_instance_count(),
1115  nrnran123_instance_count() * nrnran123_state_size());
1116  printf("%d total bytes %ld\n", nrnmpi_myid, nbyte);
1117 #endif
1118  if (detailed_report) {
1119  size_data[12] = nbyte;
1120 #if NRNMPI
1121  if (corenrn_param.mpi_enable) {
1122  // last arg is op type where 1 is sum, 2 is max and any other value is min
1123  nrnmpi_long_allreduce_vec(&size_data[0], &global_size_data_sum[0], 13, 1);
1124  nrnmpi_long_allreduce_vec(&size_data[0], &global_size_data_max[0], 13, 2);
1125  nrnmpi_long_allreduce_vec(&size_data[0], &global_size_data_min[0], 13, 3);
1126  for (int i = 0; i < 13; i++) {
1127  global_size_data_avg[i] = global_size_data_sum[i] / float(nrnmpi_numprocs);
1128  }
1129  } else
1130 #endif
1131  {
1132  global_size_data_max = size_data;
1133  global_size_data_min = size_data;
1134  global_size_data_avg.assign(size_data.cbegin(), size_data.cend());
1135  }
1136  // now print the collected data:
1137  if (nrnmpi_myid == 0) {
1138  printf("Memory size information for all NrnThreads per rank\n");
1139  printf("------------------------------------------------------------------\n");
1140  printf("%22s %12s %12s %12s\n", "field", "min", "max", "avg");
1141  printf("%22s %12ld %12ld %15.2f\n",
1142  "n_cell",
1143  global_size_data_min[0],
1144  global_size_data_max[0],
1145  global_size_data_avg[0]);
1146  printf("%22s %12ld %12ld %15.2f\n",
1147  "n_compartment",
1148  global_size_data_min[1],
1149  global_size_data_max[1],
1150  global_size_data_avg[1]);
1151  printf("%22s %12ld %12ld %15.2f\n",
1152  "n_mechanism",
1153  global_size_data_min[2],
1154  global_size_data_max[2],
1155  global_size_data_avg[2]);
1156  printf("%22s %12ld %12ld %15.2f\n",
1157  "_ndata",
1158  global_size_data_min[3],
1159  global_size_data_max[3],
1160  global_size_data_avg[3]);
1161  printf("%22s %12ld %12ld %15.2f\n",
1162  "_nidata",
1163  global_size_data_min[4],
1164  global_size_data_max[4],
1165  global_size_data_avg[4]);
1166  printf("%22s %12ld %12ld %15.2f\n",
1167  "_nvdata",
1168  global_size_data_min[5],
1169  global_size_data_max[5],
1170  global_size_data_avg[5]);
1171  printf("%22s %12ld %12ld %15.2f\n",
1172  "n_presyn",
1173  global_size_data_min[6],
1174  global_size_data_max[6],
1175  global_size_data_avg[6]);
1176  printf("%22s %12ld %12ld %15.2f\n",
1177  "n_presyn (bytes)",
1178  global_size_data_min[6] * sz_presyn,
1179  global_size_data_max[6] * sz_presyn,
1180  global_size_data_avg[6] * sz_presyn);
1181  printf("%22s %12ld %12ld %15.2f\n",
1182  "n_input_presyn",
1183  global_size_data_min[7],
1184  global_size_data_max[7],
1185  global_size_data_avg[7]);
1186  printf("%22s %12ld %12ld %15.2f\n",
1187  "n_input_presyn (bytes)",
1188  global_size_data_min[7] * sz_input_presyn,
1189  global_size_data_max[7] * sz_input_presyn,
1190  global_size_data_avg[7] * sz_input_presyn);
1191  printf("%22s %12ld %12ld %15.2f\n",
1192  "n_pntproc",
1193  global_size_data_min[8],
1194  global_size_data_max[8],
1195  global_size_data_avg[8]);
1196  printf("%22s %12ld %12ld %15.2f\n",
1197  "n_pntproc (bytes)",
1198  global_size_data_min[8] * sz_pntproc,
1199  global_size_data_max[8] * sz_pntproc,
1200  global_size_data_avg[8] * sz_pntproc);
1201  printf("%22s %12ld %12ld %15.2f\n",
1202  "n_netcon",
1203  global_size_data_min[9],
1204  global_size_data_max[9],
1205  global_size_data_avg[9]);
1206  printf("%22s %12ld %12ld %15.2f\n",
1207  "n_netcon (bytes)",
1208  global_size_data_min[9] * sz_netcon,
1209  global_size_data_max[9] * sz_netcon,
1210  global_size_data_avg[9] * sz_netcon);
1211  printf("%22s %12ld %12ld %15.2f\n",
1212  "n_weight",
1213  global_size_data_min[10],
1214  global_size_data_max[10],
1215  global_size_data_avg[10]);
1216  printf("%22s %12ld %12ld %15.2f\n",
1217  "NrnThread (bytes)",
1218  global_size_data_min[11],
1219  global_size_data_max[11],
1220  global_size_data_avg[11]);
1221  printf("%22s %12ld %12ld %15.2f\n",
1222  "model size (bytes)",
1223  global_size_data_min[12],
1224  global_size_data_max[12],
1225  global_size_data_avg[12]);
1226  }
1227  }
1228 
1229 #if NRNMPI
1230  if (corenrn_param.mpi_enable) {
1231  long global_nbyte = 0;
1232  nrnmpi_long_allreduce_vec(&nbyte, &global_nbyte, 1, 1);
1233  nbyte = global_nbyte;
1234  }
1235 #endif
1236 
1237  return nbyte;
1238 }
1239 
1240 } // namespace coreneuron