CoreNEURON
crout_thread.hpp
Go to the documentation of this file.
1 /*
2 # =============================================================================
3 # Originally crout.c from SCoP library, Copyright (c) 1987-90 Duke University
4 # =============================================================================
5 # Subsequent extensive prototype and memory layout changes for CoreNEURON
6 #
7 # Copyright (c) 2016 - 2022 Blue Brain Project/EPFL
8 #
9 # See top-level LICENSE file for details.
10 # =============================================================================.
11 */
12 #pragma once
15 
16 namespace coreneuron {
17 #if defined(scopmath_crout_ix) || defined(scopmath_crout_y) || defined(scopmath_crout_b)
18 #error "naming clash on crout_thread.hpp-internal macros"
19 #endif
20 #define scopmath_crout_b(arg) b[scopmath_crout_ix(arg)]
21 #define scopmath_crout_ix(arg) ((arg) *_STRIDE)
22 #define scopmath_crout_y(arg) _p[y[arg] * _STRIDE]
23 
24 /**
25  * Performs an LU triangular factorization of a real matrix by the Crout
26  * algorithm using partial pivoting. Rows are not normalized; implicit
27  * equilibration is used. ROUNDOFF is the minimal value for a pivot element
28  * without its being considered too close to zero (currently set to 1.0E-20).
29  *
30  * @return 0 if no error; 2 if matrix is singular or ill-conditioned
31  * @param n number of rows of the matrix
32  * @param a double precision matrix to be factored
33  * @param[out] a factors required to transform the constant vector in the set of
34  * simultaneous equations are stored in the lower triangle;
35  * factors for back substitution are stored in the upper triangle.
36  * @param[out] perm permutation vector to store row interchanges
37  *
38  * @note Having a differnt permutation per instance may not be a good idea.
39  */
40 inline int nrn_crout_thread(NewtonSpace* ns, int n, double** a, int* perm, _threadargsproto_) {
41  int save_i = 0;
42 
43  /* Initialize permutation and rowmax vectors */
44  double* rowmax = ns->rowmax;
45  for (int i = 0; i < n; i++) {
46  perm[scopmath_crout_ix(i)] = i;
47  int k = 0;
48  for (int j = 1; j < n; j++)
49  if (fabs(a[i][scopmath_crout_ix(j)]) > fabs(a[i][scopmath_crout_ix(k)]))
50  k = j;
51  rowmax[scopmath_crout_ix(i)] = a[i][scopmath_crout_ix(k)];
52  }
53 
54  /* Loop over rows and columns r */
55  for (int r = 0; r < n; r++) {
56  /*
57  * Operate on rth column. This produces the lower triangular matrix
58  * of terms needed to transform the constant vector.
59  */
60 
61  for (int i = r; i < n; i++) {
62  double sum = 0.0;
63  int irow = perm[scopmath_crout_ix(i)];
64  for (int k = 0; k < r; k++) {
65  int krow = perm[scopmath_crout_ix(k)];
66  sum += a[irow][scopmath_crout_ix(k)] * a[krow][scopmath_crout_ix(r)];
67  }
68  a[irow][scopmath_crout_ix(r)] -= sum;
69  }
70 
71  /* Find row containing the pivot in the rth column */
72  int pivot = perm[scopmath_crout_ix(r)];
73  double equil_1 = fabs(a[pivot][scopmath_crout_ix(r)] / rowmax[scopmath_crout_ix(pivot)]);
74  for (int i = r + 1; i < n; i++) {
75  int irow = perm[scopmath_crout_ix(i)];
76  double equil_2 = fabs(a[irow][scopmath_crout_ix(r)] / rowmax[scopmath_crout_ix(irow)]);
77  if (equil_2 > equil_1) {
78  /* make irow the new pivot row */
79 
80  pivot = irow;
81  save_i = i;
82  equil_1 = equil_2;
83  }
84  }
85 
86  /* Interchange entries in permutation vector if necessary */
87  if (pivot != perm[scopmath_crout_ix(r)]) {
88  perm[scopmath_crout_ix(save_i)] = perm[scopmath_crout_ix(r)];
89  perm[scopmath_crout_ix(r)] = pivot;
90  }
91 
92  /* Check that pivot element is not too small */
93  if (fabs(a[pivot][scopmath_crout_ix(r)]) < ROUNDOFF)
94  return SINGULAR;
95 
96  /*
97  * Operate on row in rth position. This produces the upper
98  * triangular matrix whose diagonal elements are assumed to be unity.
99  * This matrix is used in the back substitution algorithm.
100  */
101  for (int j = r + 1; j < n; j++) {
102  double sum = 0.0;
103  for (int k = 0; k < r; k++) {
104  int krow = perm[scopmath_crout_ix(k)];
105  sum += a[pivot][scopmath_crout_ix(k)] * a[krow][scopmath_crout_ix(j)];
106  }
107  a[pivot][scopmath_crout_ix(j)] = (a[pivot][scopmath_crout_ix(j)] - sum) /
108  a[pivot][scopmath_crout_ix(r)];
109  }
110  }
111  return SUCCESS;
112 }
113 
114 /**
115  * Performs forward substitution algorithm to transform the constant vector in
116  * the linear simultaneous equations to be consistent with the factored matrix.
117  * Then performs back substitution to find the solution to the simultaneous
118  * linear equations.
119  *
120  * @param n number of rows of the matrix
121  * @param a double precision matrix containing the factored matrix of
122  * coefficients of the linear equations
123  * @param b vector of function values
124  * @param perm permutation vector to store row interchanges
125  * @param[out] p[y[i]] contains the solution vector
126  */
127 inline void nrn_scopmath_solve_thread(int n,
128  double** a,
129  double* b,
130  int* perm,
131  double* p,
132  int* y,
134  /* Perform forward substitution with pivoting */
135  // if (y) { // pgacc bug. nullptr on cpu but not on GPU
136  if (0) {
137  for (int i = 0; i < n; i++) {
138  int pivot = perm[scopmath_crout_ix(i)];
139  double sum = 0.0;
140  for (int j = 0; j < i; j++)
141  sum += a[pivot][scopmath_crout_ix(j)] * (scopmath_crout_y(j));
142  scopmath_crout_y(i) = (scopmath_crout_b(pivot) - sum) / a[pivot][scopmath_crout_ix(i)];
143  }
144 
145  /*
146  * Note that the y vector is already in the correct order for back
147  * substitution. Perform back substitution, pivoting the matrix but not
148  * the y vector. There is no need to divide by the diagonal element as
149  * this is assumed to be unity.
150  */
151 
152  for (int i = n - 1; i >= 0; i--) {
153  int pivot = perm[scopmath_crout_ix(i)];
154  double sum = 0.0;
155  for (int j = i + 1; j < n; j++)
156  sum += a[pivot][scopmath_crout_ix(j)] * (scopmath_crout_y(j));
157  scopmath_crout_y(i) -= sum;
158  }
159  } else {
160  for (int i = 0; i < n; i++) {
161  int pivot = perm[scopmath_crout_ix(i)];
162  double sum = 0.0;
163  if (i > 0) { // pgacc bug. with i==0 the following loop executes once
164  for (int j = 0; j < i; j++) {
165  sum += a[pivot][scopmath_crout_ix(j)] * (p[scopmath_crout_ix(j)]);
166  }
167  }
168  p[scopmath_crout_ix(i)] = (scopmath_crout_b(pivot) - sum) /
169  a[pivot][scopmath_crout_ix(i)];
170  }
171 
172  /*
173  * Note that the y vector is already in the correct order for back
174  * substitution. Perform back substitution, pivoting the matrix but not
175  * the y vector. There is no need to divide by the diagonal element as
176  * this is assumed to be unity.
177  */
178  for (int i = n - 1; i >= 0; i--) {
179  int pivot = perm[scopmath_crout_ix(i)];
180  double sum = 0.0;
181  for (int j = i + 1; j < n; j++)
182  sum += a[pivot][scopmath_crout_ix(j)] * (p[scopmath_crout_ix(j)]);
183  p[scopmath_crout_ix(i)] -= sum;
184  }
185  }
186 }
187 #undef scopmath_crout_b
188 #undef scopmath_crout_ix
189 #undef scopmath_crout_y
190 } // namespace coreneuron
scopmath_crout_ix
#define scopmath_crout_ix(arg)
Definition: crout_thread.hpp:21
ROUNDOFF
#define ROUNDOFF
Definition: errcodes.h:31
coreneuron::nrn_scopmath_solve_thread
void nrn_scopmath_solve_thread(int n, double **a, double *b, int *perm, double *p, int *y, _threadargsproto_)
Performs forward substitution algorithm to transform the constant vector in the linear simultaneous e...
Definition: crout_thread.hpp:127
coreneuron::NewtonSpace
Definition: newton_struct.h:14
scopmath_crout_b
#define scopmath_crout_b(arg)
Definition: crout_thread.hpp:20
SUCCESS
#define SUCCESS
Definition: errcodes.h:48
coreneuron::nrn_crout_thread
int nrn_crout_thread(NewtonSpace *ns, int n, double **a, int *perm, _threadargsproto_)
Performs an LU triangular factorization of a real matrix by the Crout algorithm using partial pivotin...
Definition: crout_thread.hpp:40
coreneuron
THIS FILE IS AUTO GENERATED DONT MODIFY IT.
Definition: corenrn_parameters.cpp:12
coreneuron::i
int i
Definition: cellorder.cpp:485
SINGULAR
#define SINGULAR
Definition: errcodes.h:50
newton_struct.h
_threadargsproto_
#define _threadargsproto_
Definition: mod2c_core_thread.hpp:24
scopmath_crout_y
#define scopmath_crout_y(arg)
Definition: crout_thread.hpp:22
errcodes.h
coreneuron::NewtonSpace::rowmax
double * rowmax
Definition: newton_struct.h:22