Context Navigation

source: git/src/matrix.c @ 3c7ab9a

Visit:

stereo-2025

Last change on this file since 3c7ab9a was 3c7ab9a, checked in by Olly Betts <olly@…>, 12 months ago
Improve comment about how the matrix is built
Property mode set to `100644`
File size: 12.7 KB

Line
1	/* matrix.c
2	* Matrix building and solving routines
3	* Copyright (C) 1993-2003,2010,2013 Olly Betts
4	*
5	* This program is free software; you can redistribute it and/or modify
6	* it under the terms of the GNU General Public License as published by
7	* the Free Software Foundation; either version 2 of the License, or
8	* (at your option) any later version.
9	*
10	* This program is distributed in the hope that it will be useful,
11	* but WITHOUT ANY WARRANTY; without even the implied warranty of
12	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13	* GNU General Public License for more details.
14	*
15	* You should have received a copy of the GNU General Public License
16	* along with this program; if not, write to the Free Software
17	* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
18	*/
19
20	/*#define SOR 1*/
21
22	#if 0
23	# define DEBUG_INVALID 1
24	#endif
25
26	#include <config.h>
27
28	#include "debug.h"
29	#include "cavern.h"
30	#include "filename.h"
31	#include "message.h"
32	#include "netbits.h"
33	#include "matrix.h"
34	#include "out.h"
35
36	#undef PRINT_MATRICES
37	#define PRINT_MATRICES 0
38
39	#undef DEBUG_MATRIX_BUILD
40	#define DEBUG_MATRIX_BUILD 0
41
42	#undef DEBUG_MATRIX
43	#define DEBUG_MATRIX 0
44
45	#if PRINT_MATRICES
46	static void print_matrix(real M, real B, long n);
47	#endif
48
49	static void choleski(real M, real B, long n);
50
51	#ifdef SOR
52	static void sor(real M, real B, long n);
53	#endif
54
/* Access element (X, Y) of the symmetric matrix M, which is stored as a
 * packed lower triangle: row X starts at offset X*(X+1)/2 and holds X+1
 * entries.
 *
 * for M(row, col) col must be <= row, so Y <= X
 *
 * Note that X is evaluated twice, so arguments must not have side effects.
 */
# define M(X, Y) ((real *)M)[((((OSSIZE_T)(X)) * ((X) + 1)) >> 1) + (Y)]
	      /* +(Y>X?0*printf("row<col (line %d)\n",__LINE__):0) */
/*#define M_(X, Y) ((real *)M)[((((OSSIZE_T)(Y)) * ((Y) + 1)) >> 1) + (X)]*/
59
60	static int find_stn_in_tab(node *stn);
61	static int add_stn_to_tab(node *stn);
62	static void build_matrix(node *list);
63
64	static long n_stn_tab;
65
66	static pos **stn_tab;
67
68	extern void
69	solve_matrix(node *list)
70	{
71	node *stn;
72	long n = 0;
73	FOR_EACH_STN(stn, list) {
74	if (!fixed(stn)) n++;
75	}
76	if (n == 0) return;
77
78	/* we just need n to be a reasonable estimate >= the number
79	* of stations left after reduction. If memory is
80	* plentiful, we can be crass.
81	*/
82	stn_tab = osmalloc((OSSIZE_T)(n * ossizeof(pos*)));
83	n_stn_tab = 0;
84
85	FOR_EACH_STN(stn, list) {
86	if (!fixed(stn)) add_stn_to_tab(stn);
87	}
88
89	if (n_stn_tab < n) {
90	/* release unused entries in stn_tab */
91	stn_tab = osrealloc(stn_tab, n_stn_tab * ossizeof(pos*));
92	}
93
94	build_matrix(list);
95	#if DEBUG_MATRIX
96	FOR_EACH_STN(stn, list) {
97	printf("(%8.2f, %8.2f, %8.2f ) ", POS(stn, 0), POS(stn, 1), POS(stn, 2));
98	print_prefix(stn->name);
99	putnl();
100	}
101	#endif
102
103	osfree(stn_tab);
104	}
105
106	#ifdef NO_COVARIANCES
107	# define FACTOR 1
108	#else
109	# define FACTOR 3
110	#endif
111
112	static void
113	build_matrix(node *list)
114	{
115	real *M;
116	real *B;
117	int dim;
118
119	if (n_stn_tab == 0) {
120	if (!fQuiet)
121	puts(msg(/Network solved by reduction - no simultaneous equations to solve./74));
122	return;
123	}
124	/* (OSSIZE_T) cast may be needed if n_stn_tab>=181 */
125	M = osmalloc((OSSIZE_T)((((OSSIZE_T)n_stn_tab * FACTOR * (n_stn_tab * FACTOR + 1)) >> 1)) * ossizeof(real));
126	B = osmalloc((OSSIZE_T)(n_stn_tab * FACTOR * ossizeof(real)));
127
128	if (!fQuiet) {
129	if (n_stn_tab == 1)
130	out_current_action(msg(/Solving one equation/78));
131	else
132	out_current_action1(msg(/Solving %d simultaneous equations/75), n_stn_tab);
133	}
134
135	#ifdef NO_COVARIANCES
136	dim = 2;
137	#else
138	dim = 0; /* fudge next loop for now */
139	#endif
140	for ( ; dim >= 0; dim--) {
141	node *stn;
142	int row;
143
144	/* Initialise M and B to zero - zeroing "linearly" will minimise
145	* paging when the matrix is large */
146	{
147	int end = n_stn_tab * FACTOR;
148	for (row = 0; row < end; row++) B[row] = (real)0.0;
149	end = ((OSSIZE_T)n_stn_tab * FACTOR * (n_stn_tab * FACTOR + 1)) >> 1;
150	for (row = 0; row < end; row++) M[row] = (real)0.0;
151	}
152
153	/* Construct matrix by going through the stn list.
154	*
155	* All legs between two fixed stations can be ignored here.
156	*
157	* Other legs we want to add exactly once to M. To achieve this we
158	* wan to:
159	*
160	* - add forward legs between two unfixed stations,
161	*
162	* - add legs from unfixed stations to fixed stations (we do them from
163	* the unfixed end so we don't need to detect when we're at a fixed
164	* point cut line and determine which side we're currently dealing
165	* with).
166	*
167	* To implement this, we only look at legs from unfixed stations and add
168	* a leg if to a fixed station, or to an unfixed station and it's a
169	* forward leg.
170	*/
171	FOR_EACH_STN(stn, list) {
172	#ifdef NO_COVARIANCES
173	real e;
174	#else
175	svar e;
176	delta a;
177	#endif
178	int f, t;
179	int dirn;
180	#if DEBUG_MATRIX_BUILD
181	print_prefix(stn->name);
182	printf(" used: %d colour %ld\n",
183	(!!stn->leg[2]) << 2 \| (!!stn -> leg[1]) << 1 \| (!!stn->leg[0]),
184	stn->colour);
185
186	for (dirn = 0; dirn <= 2 && stn->leg[dirn]; dirn++) {
187	#ifdef NO_COVARIANCES
188	printf("Leg %d, vx=%f, reverse=%d, to ", dirn,
189	stn->leg[dirn]->v[0], stn->leg[dirn]->l.reverse);
190	#else
191	printf("Leg %d, vx=%f, reverse=%d, to ", dirn,
192	stn->leg[dirn]->v[0][0], stn->leg[dirn]->l.reverse);
193	#endif
194	print_prefix(stn->leg[dirn]->l.to->name);
195	putnl();
196	}
197	putnl();
198	#endif /* DEBUG_MATRIX_BUILD */
199
200	if (!fixed(stn)) {
201	f = find_stn_in_tab(stn);
202	for (dirn = 0; dirn <= 2 && stn->leg[dirn]; dirn++) {
203	linkfor *leg = stn->leg[dirn];
204	node *to = leg->l.to;
205	if (fixed(to)) {
206	bool fRev = !data_here(leg);
207	if (fRev) leg = reverse_leg(leg);
208	/* Ignore equated nodes */
209	#ifdef NO_COVARIANCES
210	e = leg->v[dim];
211	if (e != (real)0.0) {
212	e = ((real)1.0) / e;
213	M(f,f) += e;
214	B[f] += e * POS(to, dim);
215	if (fRev) {
216	B[f] += leg->d[dim];
217	} else {
218	B[f] -= leg->d[dim];
219	}
220	}
221	#else
222	if (invert_svar(&e, &leg->v)) {
223	delta b;
224	int i;
225	if (fRev) {
226	adddd(&a, &POSD(to), &leg->d);
227	} else {
228	subdd(&a, &POSD(to), &leg->d);
229	}
230	mulsd(&b, &e, &a);
231	for (i = 0; i < 3; i++) {
232	M(f * FACTOR + i, f * FACTOR + i) += e[i];
233	B[f * FACTOR + i] += b[i];
234	}
235	M(f * FACTOR + 1, f * FACTOR) += e[3];
236	M(f * FACTOR + 2, f * FACTOR) += e[4];
237	M(f * FACTOR + 2, f * FACTOR + 1) += e[5];
238	}
239	#endif
240	} else if (data_here(leg)) {
241	/* forward leg, unfixed -> unfixed */
242	t = find_stn_in_tab(to);
243	#if DEBUG_MATRIX
244	printf("Leg %d to %d, var %f, delta %f\n", f, t, e,
245	leg->d[dim]);
246	#endif
247	/* Ignore equated nodes & lollipops */
248	#ifdef NO_COVARIANCES
249	e = leg->v[dim];
250	if (t != f && e != (real)0.0) {
251	real a;
252	e = ((real)1.0) / e;
253	M(f,f) += e;
254	M(t,t) += e;
255	if (f < t) M(t,f) -= e; else M(f,t) -= e;
256	a = e * leg->d[dim];
257	B[f] -= a;
258	B[t] += a;
259	}
260	#else
261	if (t != f && invert_svar(&e, &leg->v)) {
262	int i;
263	mulsd(&a, &e, &leg->d);
264	for (i = 0; i < 3; i++) {
265	M(f * FACTOR + i, f * FACTOR + i) += e[i];
266	M(t * FACTOR + i, t * FACTOR + i) += e[i];
267	if (f < t)
268	M(t * FACTOR + i, f * FACTOR + i) -= e[i];
269	else
270	M(f * FACTOR + i, t * FACTOR + i) -= e[i];
271	B[f * FACTOR + i] -= a[i];
272	B[t * FACTOR + i] += a[i];
273	}
274	M(f * FACTOR + 1, f * FACTOR) += e[3];
275	M(t * FACTOR + 1, t * FACTOR) += e[3];
276	M(f * FACTOR + 2, f * FACTOR) += e[4];
277	M(t * FACTOR + 2, t * FACTOR) += e[4];
278	M(f * FACTOR + 2, f * FACTOR + 1) += e[5];
279	M(t * FACTOR + 2, t * FACTOR + 1) += e[5];
280	if (f < t) {
281	M(t * FACTOR + 1, f * FACTOR) -= e[3];
282	M(t * FACTOR, f * FACTOR + 1) -= e[3];
283	M(t * FACTOR + 2, f * FACTOR) -= e[4];
284	M(t * FACTOR, f * FACTOR + 2) -= e[4];
285	M(t * FACTOR + 2, f * FACTOR + 1) -= e[5];
286	M(t * FACTOR + 1, f * FACTOR + 2) -= e[5];
287	} else {
288	M(f * FACTOR + 1, t * FACTOR) -= e[3];
289	M(f * FACTOR, t * FACTOR + 1) -= e[3];
290	M(f * FACTOR + 2, t * FACTOR) -= e[4];
291	M(f * FACTOR, t * FACTOR + 2) -= e[4];
292	M(f * FACTOR + 2, t * FACTOR + 1) -= e[5];
293	M(f * FACTOR + 1, t * FACTOR + 2) -= e[5];
294	}
295	}
296	#endif
297	}
298	}
299	}
300	}
301
302	#if PRINT_MATRICES
303	print_matrix(M, B, n_stn_tab * FACTOR); /* 'ave a look! */
304	#endif
305
306	#ifdef SOR
307	/* defined in network.c, may be altered by -z<letters> on command line */
308	if (optimize & BITA('i'))
309	sor(M, B, n_stn_tab * FACTOR);
310	else
311	#endif
312	choleski(M, B, n_stn_tab * FACTOR);
313
314	{
315	int m;
316	for (m = (int)(n_stn_tab - 1); m >= 0; m--) {
317	#ifdef NO_COVARIANCES
318	stn_tab[m]->p[dim] = B[m];
319	if (dim == 0) {
320	SVX_ASSERT2(pos_fixed(stn_tab[m]),
321	"setting station coordinates didn't mark pos as fixed");
322	}
323	#else
324	int i;
325	for (i = 0; i < 3; i++) {
326	stn_tab[m]->p[i] = B[m * FACTOR + i];
327	}
328	SVX_ASSERT2(pos_fixed(stn_tab[m]),
329	"setting station coordinates didn't mark pos as fixed");
330	#endif
331	}
332	#if EXPLICIT_FIXED_FLAG
333	for (m = n_stn_tab - 1; m >= 0; m--) fixpos(stn_tab[m]);
334	#endif
335	}
336	}
337	osfree(B);
338	osfree(M);
339	}
340
341	static int
342	find_stn_in_tab(node *stn)
343	{
344	int i = 0;
345	pos *p = stn->name->pos;
346	while (stn_tab[i] != p)
347	if (++i == n_stn_tab) {
348	#if DEBUG_INVALID
349	fputs("Station ", stderr);
350	fprint_prefix(stderr, stn->name);
351	fputs(" not in table\n\n", stderr);
352	#endif
353	#if 0
354	print_prefix(stn->name);
355	printf(" used: %d colour %d\n",
356	(!!stn->leg[2])<<2 \| (!!stn->leg[1])<<1 \| (!!stn->leg[0]),
357	stn->colour);
358	#endif
359	fatalerror(/Bug in program detected! Please report this to the authors/11);
360	}
361	return i;
362	}
363
364	static int
365	add_stn_to_tab(node *stn)
366	{
367	int i;
368	pos *p = stn->name->pos;
369	for (i = 0; i < n_stn_tab; i++) {
370	if (stn_tab[i] == p) return i;
371	}
372	stn_tab[n_stn_tab++] = p;
373	return i;
374	}
375
376	/* Solve MX=B for X by Choleski factorisation - modified Choleski actually
377	* since we factor into LDL' while Choleski is just LL'
378	*/
379	/* Note M must be symmetric positive definite */
380	/* routine is entitled to scribble on M and B if it wishes */
381	static void
382	choleski(real M, real B, long n)
383	{
384	int i, j, k;
385
386	for (j = 1; j < n; j++) {
387	real V;
388	for (i = 0; i < j; i++) {
389	V = (real)0.0;
390	for (k = 0; k < i; k++) V += M(i,k) * M(j,k) * M(k,k);
391	M(j,i) = (M(j,i) - V) / M(i,i);
392	}
393	V = (real)0.0;
394	for (k = 0; k < j; k++) V += M(j,k) * M(j,k) * M(k,k);
395	M(j,j) -= V; /* may be best to add M() last for numerical reasons too */
396	}
397
398	/* Multiply x by L inverse */
399	for (i = 0; i < n - 1; i++) {
400	for (j = i + 1; j < n; j++) {
401	B[j] -= M(j,i) * B[i];
402	}
403	}
404
405	/* Multiply x by D inverse */
406	for (i = 0; i < n; i++) {
407	B[i] /= M(i,i);
408	}
409
410	/* Multiply x by (L transpose) inverse */
411	for (i = (int)(n - 1); i > 0; i--) {
412	for (j = i - 1; j >= 0; j--) {
413	B[j] -= M(i,j) * B[i];
414	}
415	}
416
417	/* printf("\n%ld/%ld\n\n",flops,flopsTot); */
418	}
419
#ifdef SOR
/* factor to use for SOR (must have 1 <= SOR_factor < 2) */
#define SOR_factor 1.93 /* 1.95 */

/* Solve MX=B for X by SOR of Gauss-Seidel
 *
 * M is the n by n symmetric matrix, stored as a packed lower triangle and
 * accessed via the M() macro.  Its diagonal is replaced by its reciprocal.
 *
 * B holds the n right-hand side values on entry, and is overwritten with
 * the solution X.
 *
 * Iterates until the largest change made to any element in a sweep is below
 * the threshold, or 100000 sweeps have been done (in which case failure to
 * converge is reported via BUG()).  Progress is reported on stdout.
 */
/* routine is entitled to scribble on M and B if it wishes */
static void
sor(real *M, real *B, long n)
{
   real t, x, delta, threshold, t2;
   int row, col;
   real *X;
   long it = 0;

   X = osmalloc(n * ossizeof(real));

   threshold = 0.00001;

   printf("reciprocating diagonal\n"); /* TRANSLATE */

   /* munge diagonal so we can multiply rather than divide */
   for (row = n - 1; row >= 0; row--) {
      M(row,row) = 1 / M(row,row);
      X[row] = 0;
   }

   printf("starting iteration\n"); /* TRANSLATE */

   do {
      /*printf("*");*/
      it++;
      t = 0.0;
      for (row = 0; row < n; row++) {
	 x = B[row];
	 /* Entries left of the diagonal are read along the row... */
	 for (col = 0; col < row; col++) x -= M(row,col) * X[col];
	 /* ...and those right of it from the transposed position, since
	  * only the lower triangle is stored (col++ skips the diagonal).
	  */
	 for (col++; col < n; col++) x -= M(col,row) * X[col];
	 x *= M(row,row);
	 delta = (x - X[row]) * SOR_factor;
	 X[row] += delta;
	 t2 = fabs(delta);
	 if (t2 > t) t = t2;
      }
      /* it is a long, so needs the l length modifier */
      printf("% 6ld: %8.6f\n", it, t);
   } while (t >= threshold && it < 100000);

   if (t >= threshold) {
      fprintf(stderr, "not converged after %ld iterations\n", it);
      BUG("iteration stinks");
   }

   printf("%ld iterations\n", it); /* TRANSLATE */

#if 0
   putnl();
   for (row = n - 1; row >= 0; row--) {
      t = 0.0;
      for (col = 0; col < row; col++) t += M(row, col) * X[col];
      t += X[row] / M(row, row);
      for (col = row + 1; col < n; col++)
	 t += M(col, row) * X[col];
      printf("[ %f %f ]\n", t, B[row]);
   }
#endif

   for (row = n - 1; row >= 0; row--) B[row] = X[row];

   osfree(X);
   printf("\ndone\n"); /* TRANSLATE */
}
#endif
490
#if PRINT_MATRICES
/* Debugging aid: print the matrix M and vector B to stdout.
 *
 * M is the n by n matrix, stored as a packed lower triangle and accessed via
 * the M() macro, so only the entries on and below the diagonal are printed;
 * each row is padded out with blank cells and followed by the corresponding
 * element of B.
 */
static void
print_matrix(real *M, real *B, long n)
{
   long row, col;
   printf("Matrix, M and vector, B:\n");
   for (row = 0; row < n; row++) {
      for (col = 0; col <= row; col++) printf("%6.2f\t", M(row, col));
      for (; col <= n; col++) printf(" \t");
      printf("\t%6.2f\n", B[row]);
   }
   putnl();
}
#endif

Note: See TracBrowser for help on using the repository browser.

Download in other formats: