CoreNeuron/coreneuron/mechanism/mechanism.hpp at e661bf6373d13cda0b2d16be2a8209bc3b133fe9 · BlueBrain/CoreNeuron · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
/*
# =============================================================================
# Copyright (c) 2016 - 2021 Blue Brain Project/EPFL
#
# See top-level LICENSE file for details.
# =============================================================================
*/

#pragma once

#include <string.h>

#include "coreneuron/nrnconf.h"
#include "coreneuron/utils/memory.h"

namespace coreneuron {
// The PGI compiler has issues with unions under OpenACC, so a struct is used instead.
// \todo check whether newer PGI versions have resolved this issue
#if defined(_OPENACC)
/**
 * Per-thread datum, OpenACC build variant.
 *
 * Declared as a struct, so every member has its own storage. Unlike the
 * union variant used in non-OpenACC builds, this variant has no `double val`
 * member.
 */
struct ThreadDatum {
    int i;        /* integer payload */
    double* pval; /* pointer-to-double payload */
    void* _pvoid; /* untyped pointer payload */
};
#else
/**
 * Per-thread datum, non-OpenACC build variant.
 *
 * Declared as a union: all members share the same storage, so only the
 * member most recently written may be read back.
 */
union ThreadDatum {
    double val;   /* floating-point payload (absent from the OpenACC struct variant) */
    int i;        /* integer payload */
    double* pval; /* pointer-to-double payload */
    void* _pvoid; /* untyped pointer payload */
};
#endif

/* will go away at some point */
/**
 * Small plain-data record describing one point process.
 */
struct Point_process {
    int _i_instance; /* NOTE(review): presumably the instance index within its mechanism -- confirm */
    short _type;     /* NOTE(review): presumably the mechanism type id -- confirm */
    short _tid;      /* NrnThread id */
};

/**
 * Growable set of parallel arrays holding buffered net_receive events.
 *
 * All arrays are allocated together by initialize() and resized together by
 * grow(). `_size` is the shared capacity; `_displ` always holds one element
 * more than the other arrays.
 */
struct NetReceiveBuffer_t: public UnifiedMemManaged<> {
    unified_uniq_ptr<int[]> _displ;     /* _displ_cnt + 1 of these */
    unified_uniq_ptr<int[]> _nrb_index; /* _cnt of these (order of increasing _pnt_index) */

    unified_uniq_ptr<int[]> _pnt_index;
    unified_uniq_ptr<int[]> _weight_index;
    unified_uniq_ptr<double[]> _nrb_t;
    unified_uniq_ptr<double[]> _nrb_flag;
    int _cnt = 0;
    int _displ_cnt = 0; /* number of unique _pnt_index */

    std::size_t _size = 0; /* capacity */
    int _pnt_offset = 0;

    /**
     * Number of bytes occupied by the six arrays at the current capacity.
     *
     * Counts three int arrays of `_size` elements, the `_displ` array of
     * `_size + 1` ints and two double arrays of `_size` elements. The size of
     * the struct itself is not included.
     */
    std::size_t size_of_object() const {
        std::size_t nbytes = 0;
        nbytes += _size * sizeof(int) * 3;
        nbytes += (_size + 1) * sizeof(int);
        nbytes += _size * sizeof(double) * 2;
        return nbytes;
    }

    /**
     * Allocate every array for a capacity of `size` entries.
     *
     * Any previously held arrays are replaced. `_cnt`, `_displ_cnt` and
     * `_pnt_offset` are left untouched.
     */
    void initialize(std::size_t size) {
        _size = size;
        _pnt_index = allocate_unique<int[]>(allocator<int>{}, _size);
        auto displ_size = _size + 1;
        _displ = allocate_unique<int[]>(allocator<int>{}, displ_size);
        _nrb_index = allocate_unique<int[]>(allocator<int>{}, _size);
        _weight_index = allocate_unique<int[]>(allocator<int>{}, _size);
        _nrb_t = allocate_unique<double[]>(allocator<double>{}, _size);
        _nrb_flag = allocate_unique<double[]>(allocator<double>{}, _size);
    }

    /**
     * Double the capacity of every array.
     *
     * A zero capacity grows to one entry: plain doubling would leave the
     * capacity at zero, so a caller appending after grow() would write past
     * the end of the arrays.
     * NOTE(review): assumes initialize() has been called first, so that
     * `_displ` already holds `_size + 1` elements -- confirm against callers.
     */
    void grow() {
        const std::size_t new_size = (_size == 0) ? 1 : _size * 2;
        grow_buf(_pnt_index, _size, new_size);
        grow_buf(_weight_index, _size, new_size);
        grow_buf(_nrb_t, _size, new_size);
        grow_buf(_nrb_flag, _size, new_size);
        grow_buf(_displ, _size + 1, new_size + 1);
        grow_buf(_nrb_index, _size, new_size);
        _size = new_size;
    }
};

/**
 * Growable set of parallel arrays holding buffered net_send style events.
 *
 * All six arrays share the capacity `_size`; they are allocated by the
 * constructor and resized together by grow().
 */
struct NetSendBuffer_t: public UnifiedMemManaged<> {
    unified_uniq_ptr<int[]> _sendtype;  // net_send, net_event, net_move
    unified_uniq_ptr<int[]> _vdata_index;
    unified_uniq_ptr<int[]> _pnt_index;
    unified_uniq_ptr<int[]> _weight_index;
    unified_uniq_ptr<double[]> _nsb_t;
    unified_uniq_ptr<double[]> _nsb_flag;
    int _cnt = 0;
    std::size_t _size = 0; /* capacity */
    int reallocated = 0;   /* if buffer resized/reallocated, needs to be copy to cpu */

    /**
     * Allocate every array for a capacity of `size` entries.
     *
     * `_cnt` keeps its in-class default of 0.
     * NOTE(review): `size` is converted to std::size_t as-is; callers are
     * assumed to pass a non-negative value -- confirm.
     */
    NetSendBuffer_t(int size)
        : _size(static_cast<std::size_t>(size)) {
        _sendtype = allocate_unique<int[]>(allocator<int>{}, _size);
        _vdata_index = allocate_unique<int[]>(allocator<int>{}, _size);
        _pnt_index = allocate_unique<int[]>(allocator<int>{}, _size);
        _weight_index = allocate_unique<int[]>(allocator<int>{}, _size);
        // when == 1, the NetSendBuffer_t is newly allocated (i.e. we need to free the
        // previous copy and recopy the new data)
        reallocated = 1;
        _nsb_t = allocate_unique<double[]>(allocator<double>{}, _size);
        _nsb_flag = allocate_unique<double[]>(allocator<double>{}, _size);
    }

    /**
     * Number of bytes occupied by the six arrays at the current capacity:
     * four int arrays and two double arrays of `_size` elements each. The
     * size of the struct itself is not included.
     */
    std::size_t size_of_object() const {
        std::size_t nbytes = 0;
        nbytes += _size * sizeof(int) * 4;
        nbytes += _size * sizeof(double) * 2;
        return nbytes;
    }

    /**
     * Double the capacity of every array.
     *
     * A zero capacity grows to one entry: plain doubling would leave the
     * capacity at zero, so a caller appending after grow() would write past
     * the end of the arrays.
     * NOTE(review): `reallocated` is not modified here; confirm that callers
     * do not rely on it being set after a resize.
     */
    void grow() {
        const std::size_t new_size = (_size == 0) ? 1 : _size * 2;
        grow_buf(_sendtype, _size, new_size);
        grow_buf(_vdata_index, _size, new_size);
        grow_buf(_pnt_index, _size, new_size);
        grow_buf(_weight_index, _size, new_size);
        grow_buf(_nsb_t, _size, new_size);
        grow_buf(_nsb_flag, _size, new_size);
        _size = new_size;
    }
};

/**
 * Per-mechanism list of the nodes a mechanism is attached to, together with
 * pointers to its data arrays and event buffers.
 *
 * Every member has a default initializer, so a default-constructed Memb_list
 * holds null pointers and zero counts rather than indeterminate values.
 */
struct Memb_list {
    /* nodeindices contains all nodes this extension is responsible for,
     * ordered according to the matrix. This allows to access the matrix
     * directly via the nrn_actual_* arrays instead of accessing it in the
     * order of insertion and via the node-structure, making it more
     * cache-efficient */
    int* nodeindices = nullptr;
    int* _permute = nullptr;
    double* data = nullptr;
    Datum* pdata = nullptr;
    ThreadDatum* _thread = nullptr; /* thread specific data (when static is no good) */
    NetReceiveBuffer_t* _net_receive_buffer = nullptr;
    NetSendBuffer_t* _net_send_buffer = nullptr;
    int nodecount = 0; /* actual node count */
    int _nodecount_padded = 0;
    void* instance{nullptr}; /* mechanism instance struct */
    // nrn_acc_manager.cpp handles data movement to/from the accelerator as the
    // "private constructor" in the translated MOD file code is called before
    // the main nrn_acc_manager methods that copy thread/mechanism data to the
    // device
    void* global_variables{nullptr};
    std::size_t global_variables_size{};
};
}  // namespace coreneuron