Context Navigation

source: git/src/matrix.c @ 5bb3dc4

Visit:

stereo-2025

Last change on this file since 5bb3dc4 was 5bb3dc4, checked in by Olly Betts <olly@…>, 12 months ago
Declare some variables at point of initialisation
Property mode set to `100644`
File size: 12.7 KB

Rev	Line
[421b7d2]	1	/* matrix.c
[d1b1380]	2	* Matrix building and solving routines
[a4adf09]	3	* Copyright (C) 1993-2003,2010,2013 Olly Betts
[846746e]	4	*
[89231c4]	5	* This program is free software; you can redistribute it and/or modify
	6	* it under the terms of the GNU General Public License as published by
	7	* the Free Software Foundation; either version 2 of the License, or
	8	* (at your option) any later version.
[846746e]	9	*
	10	* This program is distributed in the hope that it will be useful,
	11	* but WITHOUT ANY WARRANTY; without even the implied warranty of
[89231c4]	12	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
	13	* GNU General Public License for more details.
[846746e]	14	*
[89231c4]	15	* You should have received a copy of the GNU General Public License
	16	* along with this program; if not, write to the Free Software
[ecbc6c18]	17	* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
[d1b1380]	18	*/
	19
/*#define SOR 1*/
[702f518]	21
[032ed06]	22	#if 0
	23	# define DEBUG_INVALID 1
	24	#endif
	25
[4c83f84]	26	#include <config.h>
[d1b1380]	27
	28	#include "debug.h"
[a420b49]	29	#include "cavern.h"
[c082b69]	30	#include "filename.h"
	31	#include "message.h"
[d1b1380]	32	#include "netbits.h"
	33	#include "matrix.h"
	34	#include "out.h"
	35
	36	#undef PRINT_MATRICES
	37	#define PRINT_MATRICES 0
	38
	39	#undef DEBUG_MATRIX_BUILD
	40	#define DEBUG_MATRIX_BUILD 0
	41
	42	#undef DEBUG_MATRIX
	43	#define DEBUG_MATRIX 0
	44
	45	#if PRINT_MATRICES
[9965b2b]	46	static void print_matrix(real M, real B, long n);
[d1b1380]	47	#endif
	48
[9965b2b]	49	static void choleski(real M, real B, long n);
[3fde384f]	50
[d1b1380]	51	#ifdef SOR
[9965b2b]	52	static void sor(real M, real B, long n);
[d1b1380]	53	#endif
	54
[a420b49]	55	/* for M(row, col) col must be <= row, so Y <= X */
[9965b2b]	56	# define M(X, Y) ((real )M)[((((OSSIZE_T)(X)) ((X) + 1)) >> 1) + (Y)]
[421b7d2]	57	/* +(Y>X?0printf("row<col (line %d)\n",__LINE__):0) /
[9965b2b]	58	/#define M_(X, Y) ((real )M)[((((OSSIZE_T)(Y)) * ((Y) + 1)) >> 1) + (X)]*/
[d1b1380]	59
[a420b49]	60	static int find_stn_in_tab(node *stn);
	61	static int add_stn_to_tab(node *stn);
[eb18f4d]	62	static void build_matrix(node *list);
[d1b1380]	63
	64	static long n_stn_tab;
	65
[c19f129]	66	static pos **stn_tab;
[d1b1380]	67
[032ed06]	68	extern void
[d9b5db53]	69	solve_matrix(node *list)
[032ed06]	70	{
	71	node *stn;
[702f518]	72	long n = 0;
[d9b5db53]	73	FOR_EACH_STN(stn, list) {
[032ed06]	74	if (!fixed(stn)) n++;
	75	}
	76	if (n == 0) return;
	77
	78	/* we just need n to be a reasonable estimate >= the number
	79	* of stations left after reduction. If memory is
	80	* plentiful, we can be crass.
	81	*/
[66de220]	82	stn_tab = osmalloc((OSSIZE_T)(n * ossizeof(pos*)));
[4f613e0]	83	n_stn_tab = 0;
[cb3d1e2]	84
[d9b5db53]	85	FOR_EACH_STN(stn, list) {
[032ed06]	86	if (!fixed(stn)) add_stn_to_tab(stn);
	87	}
	88
[66de220]	89	if (n_stn_tab < n) {
	90	/* release unused entries in stn_tab */
	91	stn_tab = osrealloc(stn_tab, n_stn_tab * ossizeof(pos*));
	92	}
[cb3d1e2]	93
[eb18f4d]	94	build_matrix(list);
[2c9c3ff]	95	#if DEBUG_MATRIX
[2164fa4]	96	FOR_EACH_STN(stn, list) {
[2aa930f]	97	printf("(%8.2f, %8.2f, %8.2f ) ", POS(stn, 0), POS(stn, 1), POS(stn, 2));
[2164fa4]	98	print_prefix(stn->name);
[2aa930f]	99	putnl();
[2164fa4]	100	}
[2c9c3ff]	101	#endif
[4f613e0]	102
	103	osfree(stn_tab);
[032ed06]	104	}
[d1b1380]	105
[3fde384f]	106	#ifdef NO_COVARIANCES
[702f518]	107	# define FACTOR 1
[3fde384f]	108	#else
[702f518]	109	# define FACTOR 3
[3fde384f]	110	#endif
	111
[a420b49]	112	static void
[eb18f4d]	113	build_matrix(node *list)
[a420b49]	114	{
[eb18f4d]	115	if (n_stn_tab == 0) {
[5b68ae1]	116	if (!fQuiet)
	117	puts(msg(/Network solved by reduction - no simultaneous equations to solve./74));
[dbd68203]	118	return;
	119	}
[eb18f4d]	120	/* (OSSIZE_T) cast may be needed if n_stn_tab>=181 */
[5bb3dc4]	121	real M = osmalloc((OSSIZE_T)((((OSSIZE_T)n_stn_tab FACTOR * (n_stn_tab * FACTOR + 1)) >> 1)) * ossizeof(real));
	122	real B = osmalloc((OSSIZE_T)(n_stn_tab FACTOR * ossizeof(real)));
[dbd68203]	123
[647407d]	124	if (!fQuiet) {
[a4adf09]	125	if (n_stn_tab == 1)
	126	out_current_action(msg(/Solving one equation/78));
	127	else
	128	out_current_action1(msg(/Solving %d simultaneous equations/75), n_stn_tab);
[dbd68203]	129	}
	130
[3fde384f]	131	#ifdef NO_COVARIANCES
[5bb3dc4]	132	int dim = 2;
[3fde384f]	133	#else
[5bb3dc4]	134	int dim = 0; /* fudge next loop for now */
[3fde384f]	135	#endif
[a420b49]	136	for ( ; dim >= 0; dim--) {
[2164fa4]	137	node *stn;
	138	int row;
	139
[907fe10]	140	/* Initialise M and B to zero - zeroing "linearly" will minimise
[421b7d2]	141	* paging when the matrix is large */
[66de220]	142	{
	143	int end = n_stn_tab * FACTOR;
	144	for (row = 0; row < end; row++) B[row] = (real)0.0;
	145	end = ((OSSIZE_T)n_stn_tab * FACTOR * (n_stn_tab * FACTOR + 1)) >> 1;
	146	for (row = 0; row < end; row++) M[row] = (real)0.0;
	147	}
[dbd68203]	148
[3c7ab9a]	149	/* Construct matrix by going through the stn list.
[421b7d2]	150	*
[907fe10]	151	* All legs between two fixed stations can be ignored here.
[421b7d2]	152	*
[3c7ab9a]	153	* Other legs we want to add exactly once to M. To achieve this we
	154	* wan to:
	155	*
	156	* - add forward legs between two unfixed stations,
	157	*
	158	* - add legs from unfixed stations to fixed stations (we do them from
	159	* the unfixed end so we don't need to detect when we're at a fixed
	160	* point cut line and determine which side we're currently dealing
	161	* with).
	162	*
	163	* To implement this, we only look at legs from unfixed stations and add
	164	* a leg if to a fixed station, or to an unfixed station and it's a
	165	* forward leg.
	166	*/
[d9b5db53]	167	FOR_EACH_STN(stn, list) {
[2164fa4]	168	#ifdef NO_COVARIANCES
	169	real e;
	170	#else
[dac18d8]	171	svar e;
[eb18f4d]	172	delta a;
[2164fa4]	173	#endif
[b5d3988]	174	#if DEBUG_MATRIX_BUILD
[dbd68203]	175	print_prefix(stn->name);
[b5d3988]	176	printf(" used: %d colour %ld\n",
[a420b49]	177	(!!stn->leg[2]) << 2 \| (!!stn -> leg[1]) << 1 \| (!!stn->leg[0]),
[b5d3988]	178	stn->colour);
[3fde384f]	179
[5bb3dc4]	180	for (int dirn = 0; dirn <= 2 && stn->leg[dirn]; dirn++) {
[b5d3988]	181	#ifdef NO_COVARIANCES
[907fe10]	182	printf("Leg %d, vx=%f, reverse=%d, to ", dirn,
	183	stn->leg[dirn]->v[0], stn->leg[dirn]->l.reverse);
[b5d3988]	184	#else
[907fe10]	185	printf("Leg %d, vx=%f, reverse=%d, to ", dirn,
	186	stn->leg[dirn]->v[0][0], stn->leg[dirn]->l.reverse);
[b5d3988]	187	#endif
[907fe10]	188	print_prefix(stn->leg[dirn]->l.to->name);
	189	putnl();
	190	}
[dbd68203]	191	putnl();
[d1b1380]	192	#endif /* DEBUG_MATRIX_BUILD */
[b5d3988]	193
[907fe10]	194	if (!fixed(stn)) {
[5bb3dc4]	195	int f = find_stn_in_tab(stn);
	196	for (int dirn = 0; dirn <= 2 && stn->leg[dirn]; dirn++) {
[907fe10]	197	linkfor *leg = stn->leg[dirn];
	198	node *to = leg->l.to;
	199	if (fixed(to)) {
	200	bool fRev = !data_here(leg);
	201	if (fRev) leg = reverse_leg(leg);
	202	/* Ignore equated nodes */
[3fde384f]	203	#ifdef NO_COVARIANCES
[907fe10]	204	e = leg->v[dim];
	205	if (e != (real)0.0) {
	206	e = ((real)1.0) / e;
	207	M(f,f) += e;
[f52dcc7]	208	B[f] += e * POS(to, dim);
[907fe10]	209	if (fRev) {
[f52dcc7]	210	B[f] += leg->d[dim];
[907fe10]	211	} else {
[f52dcc7]	212	B[f] -= leg->d[dim];
[564f471]	213	}
[907fe10]	214	}
[3fde384f]	215	#else
[907fe10]	216	if (invert_svar(&e, &leg->v)) {
	217	if (fRev) {
	218	adddd(&a, &POSD(to), &leg->d);
	219	} else {
	220	subdd(&a, &POSD(to), &leg->d);
	221	}
[5bb3dc4]	222	delta b;
[907fe10]	223	mulsd(&b, &e, &a);
[5bb3dc4]	224	for (int i = 0; i < 3; i++) {
[907fe10]	225	M(f * FACTOR + i, f * FACTOR + i) += e[i];
	226	B[f * FACTOR + i] += b[i];
[564f471]	227	}
[907fe10]	228	M(f * FACTOR + 1, f * FACTOR) += e[3];
	229	M(f * FACTOR + 2, f * FACTOR) += e[4];
	230	M(f * FACTOR + 2, f * FACTOR + 1) += e[5];
	231	}
[3fde384f]	232	#endif
[907fe10]	233	} else if (data_here(leg)) {
	234	/* forward leg, unfixed -> unfixed */
[5bb3dc4]	235	int t = find_stn_in_tab(to);
[d1b1380]	236	#if DEBUG_MATRIX
[907fe10]	237	printf("Leg %d to %d, var %f, delta %f\n", f, t, e,
	238	leg->d[dim]);
[d1b1380]	239	#endif
[907fe10]	240	/* Ignore equated nodes & lollipops */
[3fde384f]	241	#ifdef NO_COVARIANCES
[907fe10]	242	e = leg->v[dim];
	243	if (t != f && e != (real)0.0) {
	244	e = ((real)1.0) / e;
	245	M(f,f) += e;
	246	M(t,t) += e;
	247	if (f < t) M(t,f) -= e; else M(f,t) -= e;
[5bb3dc4]	248	real a = e * leg->d[dim];
[907fe10]	249	B[f] -= a;
	250	B[t] += a;
	251	}
[3fde384f]	252	#else
[907fe10]	253	if (t != f && invert_svar(&e, &leg->v)) {
	254	mulsd(&a, &e, &leg->d);
[5bb3dc4]	255	for (int i = 0; i < 3; i++) {
[907fe10]	256	M(f * FACTOR + i, f * FACTOR + i) += e[i];
	257	M(t * FACTOR + i, t * FACTOR + i) += e[i];
	258	if (f < t)
	259	M(t * FACTOR + i, f * FACTOR + i) -= e[i];
	260	else
	261	M(f * FACTOR + i, t * FACTOR + i) -= e[i];
	262	B[f * FACTOR + i] -= a[i];
	263	B[t * FACTOR + i] += a[i];
	264	}
	265	M(f * FACTOR + 1, f * FACTOR) += e[3];
	266	M(t * FACTOR + 1, t * FACTOR) += e[3];
	267	M(f * FACTOR + 2, f * FACTOR) += e[4];
	268	M(t * FACTOR + 2, t * FACTOR) += e[4];
	269	M(f * FACTOR + 2, f * FACTOR + 1) += e[5];
	270	M(t * FACTOR + 2, t * FACTOR + 1) += e[5];
	271	if (f < t) {
	272	M(t * FACTOR + 1, f * FACTOR) -= e[3];
	273	M(t * FACTOR, f * FACTOR + 1) -= e[3];
	274	M(t * FACTOR + 2, f * FACTOR) -= e[4];
	275	M(t * FACTOR, f * FACTOR + 2) -= e[4];
	276	M(t * FACTOR + 2, f * FACTOR + 1) -= e[5];
	277	M(t * FACTOR + 1, f * FACTOR + 2) -= e[5];
	278	} else {
	279	M(f * FACTOR + 1, t * FACTOR) -= e[3];
	280	M(f * FACTOR, t * FACTOR + 1) -= e[3];
	281	M(f * FACTOR + 2, t * FACTOR) -= e[4];
	282	M(f * FACTOR, t * FACTOR + 2) -= e[4];
	283	M(f * FACTOR + 2, t * FACTOR + 1) -= e[5];
	284	M(f * FACTOR + 1, t * FACTOR + 2) -= e[5];
[dbd68203]	285	}
	286	}
[907fe10]	287	#endif
[564f471]	288	}
[907fe10]	289	}
[dbd68203]	290	}
[d1b1380]	291	}
	292
	293	#if PRINT_MATRICES
[eb18f4d]	294	print_matrix(M, B, n_stn_tab * FACTOR); /* 'ave a look! */
[d1b1380]	295	#endif
	296
	297	#ifdef SOR
[032ed06]	298	/* defined in network.c, may be altered by -z<letters> on command line */
[a420b49]	299	if (optimize & BITA('i'))
[eb18f4d]	300	sor(M, B, n_stn_tab * FACTOR);
[dbd68203]	301	else
[d1b1380]	302	#endif
[eb18f4d]	303	choleski(M, B, n_stn_tab * FACTOR);
[d1b1380]	304
[dbd68203]	305	{
[5bb3dc4]	306	for (int m = (int)(n_stn_tab - 1); m >= 0; m--) {
[3fde384f]	307	#ifdef NO_COVARIANCES
[c19f129]	308	stn_tab[m]->p[dim] = B[m];
[032ed06]	309	if (dim == 0) {
[4c07c51]	310	SVX_ASSERT2(pos_fixed(stn_tab[m]),
[032ed06]	311	"setting station coordinates didn't mark pos as fixed");
	312	}
[3fde384f]	313	#else
[5bb3dc4]	314	for (int i = 0; i < 3; i++) {
[c19f129]	315	stn_tab[m]->p[i] = B[m * FACTOR + i];
[702f518]	316	}
[4c07c51]	317	SVX_ASSERT2(pos_fixed(stn_tab[m]),
[032ed06]	318	"setting station coordinates didn't mark pos as fixed");
[3fde384f]	319	#endif
[a420b49]	320	}
[d1b1380]	321	#if EXPLICIT_FIXED_FLAG
[5bb3dc4]	322	for (int m = n_stn_tab - 1; m >= 0; m--) fixpos(stn_tab[m]);
[d1b1380]	323	#endif
[dbd68203]	324	}
	325	}
	326	osfree(B);
	327	osfree(M);
[d1b1380]	328	}
	329
[a420b49]	330	static int
	331	find_stn_in_tab(node *stn)
	332	{
[dbd68203]	333	int i = 0;
[eb18f4d]	334	pos *p = stn->name->pos;
	335	while (stn_tab[i] != p)
[dbd68203]	336	if (++i == n_stn_tab) {
[d1b1380]	337	#if DEBUG_INVALID
[a420b49]	338	fputs("Station ", stderr);
[eb18f4d]	339	fprint_prefix(stderr, stn->name);
	340	fputs(" not in table\n\n", stderr);
[d1b1380]	341	#endif
	342	#if 0
[dbd68203]	343	print_prefix(stn->name);
[b5d3988]	344	printf(" used: %d colour %d\n",
[dbd68203]	345	(!!stn->leg[2])<<2 \| (!!stn->leg[1])<<1 \| (!!stn->leg[0]),
[eb18f4d]	346	stn->colour);
[d1b1380]	347	#endif
[a420b49]	348	fatalerror(/Bug in program detected! Please report this to the authors/11);
[dbd68203]	349	}
	350	return i;
[d1b1380]	351	}
	352
[a420b49]	353	static int
	354	add_stn_to_tab(node *stn)
	355	{
[dbd68203]	356	int i;
[eb18f4d]	357	pos *p = stn->name->pos;
[a420b49]	358	for (i = 0; i < n_stn_tab; i++) {
[eb18f4d]	359	if (stn_tab[i] == p) return i;
[dbd68203]	360	}
[eb18f4d]	361	stn_tab[n_stn_tab++] = p;
[dbd68203]	362	return i;
[d1b1380]	363	}
	364
[702f518]	365	/* Solve MX=B for X by Choleski factorisation - modified Choleski actually
	366	* since we factor into LDL' while Choleski is just LL'
	367	*/
[d1b1380]	368	/* Note M must be symmetric positive definite */
	369	/* routine is entitled to scribble on M and B if it wishes */
[a420b49]	370	static void
[9965b2b]	371	choleski(real M, real B, long n)
[a420b49]	372	{
[5bb3dc4]	373	for (int j = 1; j < n; j++) {
[3fde384f]	374	real V;
[5bb3dc4]	375	for (int i = 0; i < j; i++) {
[421b7d2]	376	V = (real)0.0;
[5bb3dc4]	377	for (int k = 0; k < i; k++) V += M(i,k) * M(j,k) * M(k,k);
[a420b49]	378	M(j,i) = (M(j,i) - V) / M(i,i);
[dbd68203]	379	}
	380	V = (real)0.0;
[5bb3dc4]	381	for (int k = 0; k < j; k++) V += M(j,k) * M(j,k) * M(k,k);
[3fde384f]	382	M(j,j) -= V; /* may be best to add M() last for numerical reasons too */
[dbd68203]	383	}
[d1b1380]	384
[dbd68203]	385	/* Multiply x by L inverse */
[5bb3dc4]	386	for (int i = 0; i < n - 1; i++) {
	387	for (int j = i + 1; j < n; j++) {
[dbd68203]	388	B[j] -= M(j,i) * B[i];
[3fde384f]	389	}
[dbd68203]	390	}
[d1b1380]	391
[dbd68203]	392	/* Multiply x by D inverse */
[5bb3dc4]	393	for (int i = 0; i < n; i++) {
[dbd68203]	394	B[i] /= M(i,i);
[3fde384f]	395	}
	396
	397	/* Multiply x by (L transpose) inverse */
[5bb3dc4]	398	for (int i = (int)(n - 1); i > 0; i--) {
	399	for (int j = i - 1; j >= 0; j--) {
[421b7d2]	400	B[j] -= M(i,j) * B[i];
[3fde384f]	401	}
[dbd68203]	402	}
[d1b1380]	403
[dbd68203]	404	/* printf("\n%ld/%ld\n\n",flops,flopsTot); */
[d1b1380]	405	}
	406
	407	#ifdef SOR
	408	/* factor to use for SOR (must have 1 <= SOR_factor < 2) */
[702f518]	409	#define SOR_factor 1.93 /* 1.95 */
[d1b1380]	410
	411	/* Solve MX=B for X by SOR of Gauss-Siedel */
	412	/* routine is entitled to scribble on M and B if it wishes */
[a420b49]	413	static void
[9965b2b]	414	sor(real M, real B, long n)
[a420b49]	415	{
[dbd68203]	416	long it = 0;
[d1b1380]	417
[5bb3dc4]	418	real X = osmalloc(n ossizeof(real));
[d1b1380]	419
[5bb3dc4]	420	const real threshold = 0.00001;
[d1b1380]	421
[647407d]	422	printf("reciprocating diagonal\n"); /* TRANSLATE */
[d1b1380]	423
[3fde384f]	424	/* munge diagonal so we can multiply rather than divide */
[5bb3dc4]	425	for (int row = n - 1; row >= 0; row--) {
[dbd68203]	426	M(row,row) = 1 / M(row,row);
[702f518]	427	X[row] = 0;
[dbd68203]	428	}
[d1b1380]	429
[647407d]	430	printf("starting iteration\n"); /* TRANSLATE */
[d1b1380]	431
[5bb3dc4]	432	real t;
[dbd68203]	433	do {
	434	/printf("");*/
	435	it++;
	436	t = 0.0;
[5bb3dc4]	437	for (int row = 0; row < n; row++) {
	438	real x = B[row];
	439	int col;
[a420b49]	440	for (col = 0; col < row; col++) x -= M(row,col) * X[col];
	441	for (col++; col < n; col++) x -= M(col,row) * X[col];
[dbd68203]	442	x *= M(row,row);
[5bb3dc4]	443	real delta = (x - X[row]) * SOR_factor;
[dbd68203]	444	X[row] += delta;
[5bb3dc4]	445	real t2 = fabs(delta);
[dbd68203]	446	if (t2 > t) t = t2;
	447	}
[702f518]	448	printf("% 6d: %8.6f\n", it, t);
[dbd68203]	449	} while (t >= threshold && it < 100000);
[d1b1380]	450
[dbd68203]	451	if (t >= threshold) {
	452	fprintf(stderr, "not converged after %ld iterations\n", it);
	453	BUG("iteration stinks");
	454	}
[d1b1380]	455
[647407d]	456	printf("%ld iterations\n", it); /* TRANSLATE */
[d1b1380]	457
	458	#if 0
[dbd68203]	459	putnl();
[5bb3dc4]	460	for (int row = n - 1; row >= 0; row--) {
[dbd68203]	461	t = 0.0;
[5bb3dc4]	462	for (int col = 0; col < row; col++) t += M(row, col) * X[col];
[a420b49]	463	t += X[row] / M(row, row);
	464	for (col = row + 1; col < n; col++)
	465	t += M(col, row) * X[col];
[b5d3988]	466	printf("[ %f %f ]\n", t, B[row]);
[dbd68203]	467	}
[d1b1380]	468	#endif
	469
[5bb3dc4]	470	for (int row = n - 1; row >= 0; row--) B[row] = X[row];
[d1b1380]	471
[dbd68203]	472	osfree(X);
[647407d]	473	printf("\ndone\n"); /* TRANSLATE */
[dbd68203]	474	}
[d1b1380]	475	#endif
	476
	477	#if PRINT_MATRICES
[a420b49]	478	static void
[9965b2b]	479	print_matrix(real M, real B, long n)
[a420b49]	480	{
[dbd68203]	481	printf("Matrix, M and vector, B:\n");
[5bb3dc4]	482	for (long row = 0; row < n; row++) {
	483	long col;
[a420b49]	484	for (col = 0; col <= row; col++) printf("%6.2f\t", M(row, col));
	485	for (; col <= n; col++) printf(" \t");
[dbd68203]	486	printf("\t%6.2f\n", B[row]);
	487	}
	488	putnl();
	489	return;
[d1b1380]	490	}
	491	#endif

Note: See TracBrowser for help on using the repository browser.

Download in other formats: