3466/doxygen/coreneuron_2network_2multisend_8cpp_source.html

 /*

 # =============================================================================

 # Copyright (c) 2016 - 2021 Blue Brain Project/EPFL

 #

 # See top-level LICENSE file for details.

 # =============================================================================

 */


 #include "coreneuron/nrniv/nrniv_decl.h"

 #include "coreneuron/network/multisend.hpp"

 #include "coreneuron/sim/multicore.hpp"

 #include "coreneuron/network/netcon.hpp"

 #include "coreneuron/network/netcvode.hpp"


 /*

 Overall exchange strategy


 When a cell spikes, it immediately does a multisend of

 (int gid, double spiketime) to all the target machines that have

 cells that need to receive this spike by spiketime + delay.

 The MPI implementation does not block due to use of MPI_Isend.


 In order to minimize the number of nrnmpi_multisend_conserve tests

 (and potentially abandon them altogether if I can ever guarantee

 that exchange time is less than half the computation time), I divide the

 minimum delay integration intervals into two equal subintervals.

 So if a spike is generated in an even subinterval, I do not have

 to include it in the conservation check until the end of the next even

 subinterval.


 When a spike is received (generally MPI_Iprobe, MPI_Recv) it is placed in

 even or odd buffers (depending on whether the coded gid is positive or negative)


 At the end of a computation subinterval the even or odd buffer spikes

 are enqueued in the priority queue after checking that the number

 of spikes sent is equal to the number of spikes received.

 */


 // The initial idea behind the optional phase2 is to avoid the large overhead of

 // initiating a send of the up to 10k list of target hosts when a cell fires.

 // I.e. when there are a small number of cells on a processor, this causes

 // load balance problems.

 // Load balance should be better if the send is distributed to a much smaller

 // set of targets, which, when they receive the spike, pass it on to a neighbor

 // set. A non-exclusive alternative to this is the use of RECORD_REPLAY

 // which gives a very fast initiation but we have not been able to get that

 // to complete in the sense of all the targets receiving their spikes before

 // the conservation step.

 // We expect that phase2 will work best in combination with ENQUEUE=2

 // which has the greatest amount of overlap between computation

 // and communication.

 namespace coreneuron {

 // Run-time switch for the multisend exchange: nrn_multisend_advance(),
 // nrn_multisend_receive() and nrn_multisend_setup() only do exchange work
 // when this is true.
 bool use_multisend_;

 // When true, spikes received for an InputPreSyn that has a non-negative
 // multisend_phase2_index_ are queued and forwarded to a second set of ranks.
 // Also handed to nrn_multisend_setup_targets() when the target lists are built.
 bool use_phase2_;

 // Number of receive buffers initialised by nrn_multisend_init(); when it is 2
 // the current/next buffers are swapped at the end of nrn_multisend_receive().
 int n_multisend_interval = 2;


 #if NRN_MULTISEND


 // ENQUEUE 0 means to  Multisend_ReceiveBuffer buffer -> InputPreSyn.send

 // ENQUEUE 1 means to Multisend_ReceiveBuffer buffer -> psbuf -> InputPreSyn.send

 // ENQUEUE 2 means to Multisend_ReceiveBuffer.incoming -> InputPreSyn.send

 // Note that ENQUEUE 2 gives more overlap between computation and exchange

 // since the enqueuing takes place during computation except for those

 // remaining during conservation.

 // Compile-time selection of the enqueue strategy (0, 1 or 2) used by
 // nrn_multisend_advance() and nrn_multisend_receive().
 #define ENQUEUE 2


 #if ENQUEUE == 2

 // Timing counters for the ENQUEUE == 2 strategy. In this file they are only
 // ever reset to 0 (nrn_multisend_init and the end of nrn_multisend_receive);
 // NOTE(review): nothing visible here accumulates into them - confirm whether
 // they are still needed.
 static unsigned long enq2_find_time_;

 static unsigned long enq2_enqueue_time_;  // includes enq2_find_time_

 #endif


 // Capacity of the per-receive-buffer phase-2 forwarding ring. It must be a
 // power of 2 because ring indices are wrapped with PHASE2BUFFER_MASK.
 #define PHASE2BUFFER_SIZE 2048  // power of 2

 #define PHASE2BUFFER_MASK (PHASE2BUFFER_SIZE - 1)

 // One pending phase-2 forward: a spike that was received for `ps` and still
 // has to be passed on by Multisend_ReceiveBuffer::phase2send().
 struct Phase2Buffer {

     // InputPreSyn looked up from the received gid; its
     // multisend_phase2_index_ selects the phase-2 target list.
     InputPreSyn* ps;

     // Spike time copied from the received spike.
     double spiketime;

     // gid copied from the received spike (phase2send() complements it again
     // when the owning buffer has a non-zero index_).
     int gid;

 };


 // Initial capacity (in spikes) of a receive buffer; incoming() doubles it on demand.
 #define MULTISEND_RECEIVEBUFFER_SIZE 10000

 /**
  * Holds the spikes received for one integration subinterval until they are
  * delivered to their InputPreSyn, together with the counters used for the
  * send/receive conservation check and the ring of pending phase-2 forwards.
  *
  * The object owns three heap arrays (buffer_, psbuf_, phase2_buffer_) plus the
  * individual spikes stored in buffer_, all released by the destructor. Copying
  * would therefore lead to a double free, so copy construction and copy
  * assignment are deleted.
  */
 class Multisend_ReceiveBuffer {
   public:
     Multisend_ReceiveBuffer();
     virtual ~Multisend_ReceiveBuffer();

     // Owning raw pointers: forbid copies (and thereby implicit moves).
     Multisend_ReceiveBuffer(const Multisend_ReceiveBuffer&) = delete;
     Multisend_ReceiveBuffer& operator=(const Multisend_ReceiveBuffer&) = delete;

     // Reset all counters, drop undelivered spikes and remember the buffer index.
     void init(int index);
     // Store one received spike (growing buffer_ if it is full).
     void incoming(int gid, double spiketime);
     // Deliver every stored spike to its InputPreSyn, then run phase2send().
     void enqueue();

     int index_{};                             // slot in multisend_receive_buffer; set by init()
     int size_{MULTISEND_RECEIVEBUFFER_SIZE};  // capacity of buffer_ (and psbuf_ when allocated)
     int count_{};                             // number of spikes currently stored
     int maxcount_{};                          // largest value count_ has reached since init()
     bool busy_{};                             // guard flag checked with nrn_assert on entry to each method
     int nsend_{}, nrecv_{};                   // for checking conservation
     int nsend_cell_{};                        // cells that spiked this interval.
     NRNMPI_Spike** buffer_{};                 // owned array of owned, individually allocated spikes

     // ENQUEUE == 1 only: enqueue1() resolves gids into psbuf_, enqueue2() delivers.
     void enqueue1();
     void enqueue2();
     InputPreSyn** psbuf_{};  // allocated by the constructor only when ENQUEUE == 1

     // Forward every queued phase-2 entry to its phase-2 target ranks.
     void phase2send();
     int phase2_head_{};  // ring index where the next phase-2 entry is written
     int phase2_tail_{};  // ring index of the next phase-2 entry to send
     int phase2_nsend_cell_{}, phase2_nsend_{};
     Phase2Buffer* phase2_buffer_{};  // owned ring of PHASE2BUFFER_SIZE entries
 };


 // Compile-time number of receive-buffer slots.
 #define MULTISEND_INTERVAL 2

 // Receive buffers, allocated lazily by nrn_multisend_setup().
 static Multisend_ReceiveBuffer* multisend_receive_buffer[MULTISEND_INTERVAL];

 // current_rbuf: buffer whose spikes are enqueued / conservation-checked now.
 // next_rbuf: buffer that accounts for spikes sent by nrn_multisend_send().
 // Both are set in nrn_multisend_init() and rotated in nrn_multisend_receive().
 static int current_rbuf, next_rbuf;

 #if MULTISEND_INTERVAL == 2

 // note that if a spike is supposed to be received by multisend_receive_buffer[1]

 // then during transmission its gid is complemented.

 #endif


 // Phase-1 target table, filled by nrn_multisend_setup_targets() and freed in
 // nrn_multisend_cleanup(). The record at offset PreSyn::multisend_index_ is
 // cnt, cnt_phase1, followed by the target ranks.
 static int* targets_phase1_;

 // Phase-2 target table, same ownership. The record at offset
 // InputPreSyn::multisend_phase2_index_ is cnt_phase2 followed by target ranks.
 static int* targets_phase2_;


 /**
  * Start the phase-1 multisend of a spike fired by a local cell.
  *
  * \param ps  source PreSyn; nothing happens when its multisend_index_ is negative.
  * \param t   spike time put on the wire.
  * \param nt  must be the first thread (nrn_threads); any other thread trips
  *            assert(0) and nothing is sent.
  *
  * The send counter of the "next" receive buffer grows by the total target
  * count (cnt) while the message itself only goes to the cnt_phase1 ranks.
  */
 void nrn_multisend_send(PreSyn* ps, double t, NrnThread* nt) {
     const int record_offset = ps->multisend_index_;
     if (record_offset < 0) {
         return;
     }

     // Record layout: cnt, cnt_phase1, array of target ranks.
     // Valid for one or two phase.
     int* record = targets_phase1_ + record_offset;
     const int total_targets = record[0];
     const int phase1_targets = record[1];
     int* target_ranks = record + 2;

     NRNMPI_Spike spike;
     // A spike destined for receive buffer 1 travels with a complemented gid.
     spike.gid = (next_rbuf == 1) ? ~ps->output_index_ : ps->output_index_;
     spike.spiketime = t;

     if (nt != nrn_threads) {
         assert(0);
         return;
     }

     Multisend_ReceiveBuffer* accounting = multisend_receive_buffer[next_rbuf];
     accounting->nsend_ += total_targets;
     accounting->nsend_cell_ += 1;
     nrnmpi_multisend(&spike, phase1_targets, target_ranks);
 }


 /**
  * Forward a received spike to the phase-2 target ranks of \p ps.
  *
  * \param ps   InputPreSyn whose multisend_phase2_index_ (asserted >= 0)
  *             locates the phase-2 record in targets_phase2_.
  * \param gid  gid exactly as it should appear on the wire.
  * \param t    spike time.
  */
 static void multisend_send_phase2(InputPreSyn* ps, int gid, double t) {
     const int record_offset = ps->multisend_phase2_index_;
     assert(record_offset >= 0);

     // Record layout: cnt_phase2, array of target ranks.
     int* record = targets_phase2_ + record_offset;

     NRNMPI_Spike spike;
     spike.gid = gid;
     spike.spiketime = t;
     nrnmpi_multisend(&spike, record[0], record + 1);
 }


 /**
  * Allocate the spike pointer array (size_ entries), the phase-2 ring
  * (PHASE2BUFFER_SIZE entries) and, only when ENQUEUE == 1, the parallel
  * InputPreSyn array. All other members keep their in-class initialisers.
  */
 Multisend_ReceiveBuffer::Multisend_ReceiveBuffer()
     : buffer_(new NRNMPI_Spike*[size_])
 #if ENQUEUE == 1
     , psbuf_(new InputPreSyn*[size_])
 #endif
     , phase2_buffer_(new Phase2Buffer[PHASE2BUFFER_SIZE]) {
 }


 /**
  * Release any spikes still stored and the three arrays owned by the buffer.
  * The buffer must not be in the middle of an operation (busy_ is asserted false).
  */
 Multisend_ReceiveBuffer::~Multisend_ReceiveBuffer() {
     nrn_assert(!busy_);

     // Spikes that were received but never delivered are still owned here.
     int k = 0;
     while (k < count_) {
         delete buffer_[k];
         ++k;
     }

     delete[] buffer_;
     delete[] psbuf_;  // may be nullptr; delete[] on a null pointer does nothing
     delete[] phase2_buffer_;
 }

 /**
  * Put the buffer back into its empty state and record which slot of
  * multisend_receive_buffer it occupies.
  *
  * \param index  stored in index_ (a non-zero value makes phase2send()
  *               complement the gid it forwards).
  */
 void Multisend_ReceiveBuffer::init(int index) {
     index_ = index;
     busy_ = false;

     // Throw away spikes that were received but never enqueued.
     int k = 0;
     while (k < count_) {
         delete buffer_[k];
         ++k;
     }
     count_ = 0;

     // Conservation counters and high-water mark.
     maxcount_ = 0;
     nrecv_ = 0;
     nsend_ = 0;
     nsend_cell_ = 0;

     // Empty phase-2 ring and its counters.
     phase2_tail_ = 0;
     phase2_head_ = 0;
     phase2_nsend_ = 0;
     phase2_nsend_cell_ = 0;
 }

 void Multisend_ReceiveBuffer::incoming(int gid, double spiketime) {

     // printf("%d %p.incoming %g %g %d\n", nrnmpi_myid, this, t, spk->spiketime, spk->gid);

     nrn_assert(!busy_);

     busy_ = true;


     if (count_ >= size_) {

         size_ *= 2;

         NRNMPI_Spike** newbuf = new NRNMPI_Spike*[size_];

         for (int i = 0; i < count_; ++i) {

             newbuf[i] = buffer_[i];

         }

         delete[] buffer_;

         buffer_ = newbuf;

         if (psbuf_) {

             delete[] psbuf_;

             psbuf_ = new InputPreSyn*[size_];

         }

     }

     NRNMPI_Spike* spk = new NRNMPI_Spike();

     spk->gid = gid;

     spk->spiketime = spiketime;

     buffer_[count_++] = spk;

     if (maxcount_ < count_) {

         maxcount_ = count_;

     }


     ++nrecv_;

     busy_ = false;

 }

 void Multisend_ReceiveBuffer::enqueue() {

     // printf("%d %p.enqueue count=%d t=%g nrecv=%d nsend=%d\n", nrnmpi_myid, this, t, count_,

     // nrecv_, nsend_);

     nrn_assert(!busy_);

     busy_ = true;


     for (int i = 0; i < count_; ++i) {

         NRNMPI_Spike* spk = buffer_[i];


         auto gid2in_it = gid2in.find(spk->gid);

         assert(gid2in_it != gid2in.end());

         InputPreSyn* ps = gid2in_it->second;


         if (use_phase2_ && ps->multisend_phase2_index_ >= 0) {

             Phase2Buffer& pb = phase2_buffer_[phase2_head_++];

             phase2_head_ &= PHASE2BUFFER_MASK;

             assert(phase2_head_ != phase2_tail_);

             pb.ps = ps;

             pb.spiketime = spk->spiketime;

             pb.gid = spk->gid;

         }


         ps->send(spk->spiketime, net_cvode_instance, nrn_threads);

         delete spk;

     }


     count_ = 0;

 #if ENQUEUE != 2

     nrecv_ = 0;

     nsend_ = 0;

     nsend_cell_ = 0;

 #endif

     busy_ = false;

     phase2send();

 }


 void Multisend_ReceiveBuffer::enqueue1() {

     // printf("%d %lx.enqueue count=%d t=%g nrecv=%d nsend=%d\n", nrnmpi_myid, (long)this, t,

     // count_, nrecv_, nsend_);

     nrn_assert(!busy_);

     busy_ = true;

     for (int i = 0; i < count_; ++i) {

         NRNMPI_Spike* spk = buffer_[i];


         auto gid2in_it = gid2in.find(spk->gid);

         assert(gid2in_it != gid2in.end());

         InputPreSyn* ps = gid2in_it->second;

         psbuf_[i] = ps;

         if (use_phase2_ && ps->multisend_phase2_index_ >= 0) {

             Phase2Buffer& pb = phase2_buffer_[phase2_head_++];

             phase2_head_ &= PHASE2BUFFER_MASK;

             assert(phase2_head_ != phase2_tail_);

             pb.ps = ps;

             pb.spiketime = spk->spiketime;

             pb.gid = spk->gid;

         }

     }

     busy_ = false;

     phase2send();

 }


 /**
  * Second half of the ENQUEUE == 1 strategy: deliver every stored spike to the
  * InputPreSyn that enqueue1() placed at the same index of psbuf_, free the
  * spikes and reset the buffer and its conservation counters.
  *
  * Precondition: enqueue1() has filled psbuf_[0 .. count_-1] for the spikes
  * currently stored.
  */
 void Multisend_ReceiveBuffer::enqueue2() {
     // printf("%d %lx.enqueue count=%d t=%g nrecv=%d nsend=%d\n", nrnmpi_myid, (long)this, t,
     // count_, nrecv_, nsend_);
     nrn_assert(!busy_);
     // Mark the buffer as in use for the duration of the delivery loop, as the
     // other methods do, so the nrn_assert(!busy_) guards can catch re-entry.
     // (This used to be set to false, which left the guard disarmed.)
     busy_ = true;

     for (int i = 0; i < count_; ++i) {
         NRNMPI_Spike* spk = buffer_[i];
         InputPreSyn* ps = psbuf_[i];
         ps->send(spk->spiketime, net_cvode_instance, nrn_threads);
         delete spk;
     }

     count_ = 0;
     nrecv_ = 0;
     nsend_ = 0;
     nsend_cell_ = 0;
     busy_ = false;
 }


 void Multisend_ReceiveBuffer::phase2send() {

     while (phase2_head_ != phase2_tail_) {

         Phase2Buffer& pb = phase2_buffer_[phase2_tail_++];

         phase2_tail_ &= PHASE2BUFFER_MASK;

         int gid = pb.gid;

         if (index_) {

             gid = ~gid;

         }

         multisend_send_phase2(pb.ps, gid, pb.spiketime);

     }

 }


 // Reset to 0 by nrn_multisend_setup().
 // NOTE(review): no other use is visible in this file - confirm whether the
 // target setup code still updates it.
 static int max_ntarget_host;

 // For one phase sending, max_multisend_targets is max_ntarget_host.

 // For two phase sending, it is the maximum of all the

 // ntarget_hosts_phase1 and ntarget_hosts_phase2.

 // Also reset to 0 by nrn_multisend_setup().
 static int max_multisend_targets;


 /**
  * Reset the first n_multisend_interval receive buffers and the current/next
  * buffer selectors. The buffers must already have been allocated (see
  * nrn_multisend_setup); they are dereferenced without a null check.
  */
 void nrn_multisend_init() {
     int slot = 0;
     while (slot < n_multisend_interval) {
         multisend_receive_buffer[slot]->init(slot);
         ++slot;
     }

     next_rbuf = n_multisend_interval - 1;
     current_rbuf = 0;
 #if ENQUEUE == 2
     enq2_enqueue_time_ = 0;
     enq2_find_time_ = 0;
 #endif
 }


 /**
  * Pull every spike that nrnmpi_multisend_single_advance() currently has
  * available and store it in the matching receive buffer.
  *
  * With MULTISEND_INTERVAL == 2 a negative gid marks a spike for buffer 1; the
  * gid is complemented back before it is stored.
  *
  * \return number of spikes stored by this call.
  */
 static int multisend_advance() {
     int nreceived = 0;
     NRNMPI_Spike spk;

     for (; nrnmpi_multisend_single_advance(&spk); ++nreceived) {
         int which = 0;
 #if MULTISEND_INTERVAL == 2
         if (spk.gid < 0) {
             which = 1;
             spk.gid = ~spk.gid;
         }
 #endif
         multisend_receive_buffer[which]->incoming(spk.gid, spk.spiketime);
     }

     return nreceived;
 }


 #if NRN_MULTISEND
 /**
  * When multisend is enabled, collect the spikes that have arrived so far and,
  * for ENQUEUE == 2, immediately enqueue those held by the current buffer.
  * Does nothing when use_multisend_ is false.
  */
 void nrn_multisend_advance() {
     if (!use_multisend_) {
         return;
     }

     multisend_advance();
 #if ENQUEUE == 2
     multisend_receive_buffer[current_rbuf]->enqueue();
 #endif
 }
 #endif


 /**
  * End-of-subinterval exchange step.
  *
  * Keeps receiving until nrnmpi_multisend_conserve() reports 0 for the send
  * and receive counters of the current buffer, enqueues the buffer according
  * to the ENQUEUE strategy and finally, when two intervals are in use, makes
  * the next buffer current.
  *
  * \param nt  must be the first thread (asserted).
  */
 void nrn_multisend_receive(NrnThread* nt) {
     assert(nt == nrn_threads);

     // Number of extra receive rounds needed before conservation held.
     int ncons = 0;
     Multisend_ReceiveBuffer* const rbuf = multisend_receive_buffer[current_rbuf];
     int& nsent = rbuf->nsend_;
     int& nreceived = rbuf->nrecv_;

 #if NRN_MULTISEND & 1
     if (use_multisend_) {
         nrn_multisend_advance();
         nrnmpi_barrier();
         nrn_multisend_advance();
         // with two phase we expect conservation to hold and ncons should
         // be 0.
         for (; nrnmpi_multisend_conserve(nsent, nreceived) != 0; ++ncons) {
             nrn_multisend_advance();
         }
     }
 #endif

 #if ENQUEUE == 0
     rbuf->enqueue();
 #endif
 #if ENQUEUE == 1
     rbuf->enqueue1();
     rbuf->enqueue2();
 #endif
 #if ENQUEUE == 2
     rbuf->enqueue();

     // enqueue() leaves the counters alone for this strategy; clear them here.
     rbuf->nsend_cell_ = 0;
     nreceived = 0;
     nsent = 0;
     rbuf->phase2_nsend_cell_ = 0;
     rbuf->phase2_nsend_ = 0;

     enq2_find_time_ = 0;
     enq2_enqueue_time_ = 0;
 #endif  // ENQUEUE == 2

 #if MULTISEND_INTERVAL == 2
     // Swap the roles of the two buffers for the next subinterval.
     if (n_multisend_interval == 2) {
         current_rbuf = next_rbuf;
         next_rbuf = (next_rbuf + 1) & 1;
     }
 #endif
 }


 /**
  * Free the phase-1 and phase-2 target tables and null the pointers so the
  * function can safely be called again.
  */
 void nrn_multisend_cleanup() {
     // delete[] accepts a null pointer, so no explicit check is required.
     delete[] targets_phase1_;
     targets_phase1_ = nullptr;

     delete[] targets_phase2_;
     targets_phase2_ = nullptr;

     // TODO: cleanup MultisendReceiveBuffer here as well
 }


 /**
  * (Re)build the multisend target tables and make sure the receive buffers
  * exist. Any previous target tables are released first; when multisend is
  * disabled nothing else is done.
  */
 void nrn_multisend_setup() {
     nrn_multisend_cleanup();

     if (use_multisend_) {
         nrnmpi_multisend_comm();

         // Although we only care about the set of hosts that gid2out_ sends
         // spikes to (source centric), we do not want to send the entire list
         // of gid2in (which may be 10000 times larger than gid2out) from every
         // machine to every machine. So the task is accomplished in two
         // phases: the first involves an allgather with a total receive buffer
         // size of the number of cells (even that is too large and will be
         // split into chunks), the second an allreduce with a receive buffer
         // size of the number of hosts.
         max_ntarget_host = 0;
         max_multisend_targets = 0;

         // completely new algorithm does one and two phase.
         nrn_multisend_setup_targets(use_phase2_, targets_phase1_, targets_phase2_);

         // Receive buffers are created once and kept across repeated setups.
         if (multisend_receive_buffer[0] == nullptr) {
             multisend_receive_buffer[0] = new Multisend_ReceiveBuffer();
         }
 #if MULTISEND_INTERVAL == 2
         if (n_multisend_interval == 2 && multisend_receive_buffer[1] == nullptr) {
             multisend_receive_buffer[1] = new Multisend_ReceiveBuffer();
         }
 #endif
     }
 }

 #endif  // NRN_MULTISEND

 }  // namespace coreneuron

nrnmpi_barrier
static void nrnmpi_barrier()
Definition: bbsavestate.cpp:228

Multisend_ReceiveBuffer
Definition: multisend.cpp:102

Multisend_ReceiveBuffer::init
void init(int index)
Definition: multisend.cpp:185

Multisend_ReceiveBuffer::incoming
void incoming(int gid, double spiketime)
Definition: multisend.cpp:196

Multisend_ReceiveBuffer::phase2_nsend_cell_
int phase2_nsend_cell_
Definition: multisend.cpp:128

Multisend_ReceiveBuffer::Multisend_ReceiveBuffer
Multisend_ReceiveBuffer()
Definition: multisend.cpp:161

Multisend_ReceiveBuffer::maxcount_
int maxcount_
Definition: multisend.cpp:112

Multisend_ReceiveBuffer::busy_
int busy_
Definition: multisend.cpp:113

Multisend_ReceiveBuffer::phase2send
void phase2send()
Definition: multisend.cpp:302

Multisend_ReceiveBuffer::phase2_head_
int phase2_head_
Definition: multisend.cpp:126

Multisend_ReceiveBuffer::nsend_cell_
int nsend_cell_
Definition: multisend.cpp:115

Multisend_ReceiveBuffer::enqueue
void enqueue()
Definition: multisend.cpp:223

Multisend_ReceiveBuffer::nrecv_
int nrecv_
Definition: multisend.cpp:114

Multisend_ReceiveBuffer::phase2_nsend_
int phase2_nsend_
Definition: multisend.cpp:128

Multisend_ReceiveBuffer::nsend_
int nsend_
Definition: multisend.cpp:114

Multisend_ReceiveBuffer::~Multisend_ReceiveBuffer
virtual ~Multisend_ReceiveBuffer()
Definition: multisend.cpp:174

Multisend_ReceiveBuffer::size_
int size_
Definition: multisend.cpp:110

Multisend_ReceiveBuffer::buffer_
NRNMPI_Spike ** buffer_
Definition: multisend.cpp:117

Multisend_ReceiveBuffer::phase2_buffer_
Phase2Buffer * phase2_buffer_
Definition: multisend.cpp:129

Multisend_ReceiveBuffer::psbuf_
PreSyn ** psbuf_
Definition: multisend.cpp:124

Multisend_ReceiveBuffer::count_
int count_
Definition: multisend.cpp:111

Multisend_ReceiveBuffer::phase2_tail_
int phase2_tail_
Definition: multisend.cpp:127

Multisend_ReceiveBuffer::index_
int index_
Definition: multisend.cpp:109

PreSyn
Definition: netcon.h:258

PreSyn::output_index_
int output_index_
Definition: netcon.h:308

PreSyn::send
virtual void send(double sendtime, NetCvode *, NrnThread *)
Definition: netcvode.cpp:3016

coreneuron::InputPreSyn
Definition: netcon.hpp:130

cnt
#define cnt
Definition: tqueue.hpp:44

i
#define i
Definition: md1redef.h:19

assert
#define assert(ex)
Definition: hocassrt.h:24

ncons
static int ncons
Definition: kinetic.cpp:456

init
void init()
Definition: init.cpp:141

multicore.hpp

multisend.hpp

coreneuron
THIS FILE IS AUTO GENERATED DONT MODIFY IT.
Definition: corenrn_parameters.cpp:12

coreneuron::nrn_threads
NrnThread * nrn_threads
Definition: multicore.cpp:56

coreneuron::use_phase2_
bool use_phase2_
Definition: multisend.cpp:54

coreneuron::nrn_multisend_send
void nrn_multisend_send(PreSyn *, double t, NrnThread *)

coreneuron::t
double t
Definition: register_mech.cpp:23

coreneuron::gid2in
std::map< int, InputPreSyn * > gid2in
Definition: nrn_setup.cpp:160

coreneuron::use_multisend_
bool use_multisend_
Definition: multisend.cpp:53

coreneuron::n_multisend_interval
int n_multisend_interval
Definition: multisend.cpp:55

coreneuron::nrn_multisend_receive
void nrn_multisend_receive(NrnThread *)

coreneuron::nrn_multisend_setup_targets
void nrn_multisend_setup_targets(bool use_phase2, int *&targets_phase1, int *&targets_phase2)

coreneuron::nrn_multisend_advance
void nrn_multisend_advance()

coreneuron::net_cvode_instance
NetCvode * net_cvode_instance
Definition: netcvode.cpp:35

netcon.hpp

netcvode.hpp

nrn_assert
#define nrn_assert(x)
assert()-like macro, independent of NDEBUG status
Definition: nrn_assert.h:33

j
size_t j
Definition: nrngsl_real_radix2.cpp:50

MULTISEND_RECEIVEBUFFER_SIZE
#define MULTISEND_RECEIVEBUFFER_SIZE
Definition: multisend.cpp:101

nrn_multisend_setup
void nrn_multisend_setup()
Definition: multisend.cpp:617

multisend_receive_buffer
static Multisend_ReceiveBuffer * multisend_receive_buffer[2]
Definition: multisend.cpp:156

s
s
Definition: multisend.cpp:521

nrnmpi_multisend_comm
void nrnmpi_multisend_comm()

PHASE2BUFFER_MASK
#define PHASE2BUFFER_MASK
Definition: multisend.cpp:91

nrn_multisend_init
static void nrn_multisend_init()
Definition: multisend.cpp:375

nrnmpi_multisend_single_advance
int nrnmpi_multisend_single_advance(NRNMPI_Spike *)

nrn_multisend_cleanup
static void nrn_multisend_cleanup()
Definition: multisend.cpp:566

ENQUEUE
#define ENQUEUE
Definition: multisend.cpp:83

multisend_advance
static int multisend_advance()
Definition: multisend.cpp:389

next_rbuf
static int next_rbuf
Definition: multisend.cpp:157

max_multisend_targets
static int max_multisend_targets
Definition: multisend.cpp:317

enq2_enqueue_time_
static unsigned long enq2_enqueue_time_
Definition: multisend.cpp:87

nrnmpi_multisend_conserve
int nrnmpi_multisend_conserve(int nsend, int nrecv)

current_rbuf
static int current_rbuf
Definition: multisend.cpp:157

use_phase2_
static int use_phase2_
Definition: multisend.cpp:132

max_ntarget_host
static int max_ntarget_host
Definition: multisend.cpp:313

enq2_find_time_
static unsigned long enq2_find_time_
Definition: multisend.cpp:86

if
if(n_multisend_interval==2)
Definition: multisend.cpp:534

phase2_nsend_
multisend_receive_buffer[current_rbuf] phase2_nsend_
Definition: multisend.cpp:523

enqueue
multisend_receive_buffer[current_rbuf] enqueue()

phase2_nsend_cell_
multisend_receive_buffer[current_rbuf] phase2_nsend_cell_
Definition: multisend.cpp:522

PHASE2BUFFER_SIZE
#define PHASE2BUFFER_SIZE
Definition: multisend.cpp:90

n_multisend_interval
static int n_multisend_interval
Definition: netpar.cpp:32

nrniv_decl.h

index
short index
Definition: cabvars.h:11

NRNMPI_Spike
Definition: nrnmpi.h:16

NRNMPI_Spike::spiketime
double spiketime
Definition: nrnmpi.h:18

NRNMPI_Spike::gid
int gid
Definition: nrnmpi.h:17

NrnThread
Represent main neuron object computed by single thread.
Definition: multicore.h:58

Phase2Buffer
Definition: multisend.cpp:92

Phase2Buffer::ps
PreSyn * ps
Definition: multisend.cpp:93

Phase2Buffer::spiketime
double spiketime
Definition: multisend.cpp:94